zig

fork of https://codeberg.org/ziglang/zig
Log | Files | Refs | README | LICENSE

arm_neon.h (2788713B) - Raw


      1 /*===---- arm_neon.h - ARM Neon intrinsics ---------------------------------===
      2  *
      3  * Permission is hereby granted, free of charge, to any person obtaining a copy
      4  * of this software and associated documentation files (the "Software"), to deal
      5  * in the Software without restriction, including without limitation the rights
      6  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
      7  * copies of the Software, and to permit persons to whom the Software is
      8  * furnished to do so, subject to the following conditions:
      9  *
     10  * The above copyright notice and this permission notice shall be included in
     11  * all copies or substantial portions of the Software.
     12  *
     13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     15  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
     16  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
     17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
     18  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
     19  * THE SOFTWARE.
     20  *
     21  *===-----------------------------------------------------------------------===
     22  */
     23 
     24 #ifndef __ARM_NEON_H
     25 #define __ARM_NEON_H
     26 
     27 #ifndef __ARM_FP
     28 #error "NEON intrinsics not available with the soft-float ABI. Please use -mfloat-abi=softfp or -mfloat-abi=hard"
     29 #else
     30 
     31 #include <stdint.h>
     32 
     33 #include <arm_bf16.h>
     34 #include <arm_vector_types.h>
     35 #if defined(__aarch64__) || defined(__arm64ec__)
        /* Scalar polynomial element types. When __aarch64__ or __arm64ec__ is
         * defined they alias the unsigned fixed-width integers and a 128-bit
         * poly128_t is also provided; otherwise they alias the signed
         * fixed-width integers and poly128_t is not declared. */
     36 typedef uint8_t poly8_t;
     37 typedef uint16_t poly16_t;
     38 typedef uint64_t poly64_t;
     39 typedef __uint128_t poly128_t;
     40 #else
     41 typedef int8_t poly8_t;
     42 typedef int16_t poly16_t;
     43 typedef int64_t poly64_t;
     44 #endif
        /* Polynomial vector types. The neon_polyvector_type argument matches the
         * lane count in each type name (polyNxM_t carries M elements of
         * polyN_t). */
     45 typedef __attribute__((neon_polyvector_type(8))) poly8_t poly8x8_t;
     46 typedef __attribute__((neon_polyvector_type(16))) poly8_t poly8x16_t;
     47 typedef __attribute__((neon_polyvector_type(4))) poly16_t poly16x4_t;
     48 typedef __attribute__((neon_polyvector_type(8))) poly16_t poly16x8_t;
     49 typedef __attribute__((neon_polyvector_type(1))) poly64_t poly64x1_t;
     50 typedef __attribute__((neon_polyvector_type(2))) poly64_t poly64x2_t;
     51 
     52 typedef struct poly8x8x2_t {
        /* This struct and the five x2 structs that follow each wrap two
         * vectors of a single polynomial vector type in a val[2] array. */
     53   poly8x8_t val[2];
     54 } poly8x8x2_t;
     55 
     56 typedef struct poly8x16x2_t {
     57   poly8x16_t val[2]; /* two poly8x16_t vectors */
     58 } poly8x16x2_t;
     59 
     60 typedef struct poly16x4x2_t {
     61   poly16x4_t val[2]; /* two poly16x4_t vectors */
     62 } poly16x4x2_t;
     63 
     64 typedef struct poly16x8x2_t {
     65   poly16x8_t val[2]; /* two poly16x8_t vectors */
     66 } poly16x8x2_t;
     67 
     68 typedef struct poly64x1x2_t {
     69   poly64x1_t val[2]; /* two poly64x1_t vectors */
     70 } poly64x1x2_t;
     71 
     72 typedef struct poly64x2x2_t {
     73   poly64x2_t val[2]; /* two poly64x2_t vectors */
     74 } poly64x2x2_t;
     75 
     76 typedef struct poly8x8x3_t {
        /* This struct and the five x3 structs that follow each wrap three
         * vectors of a single polynomial vector type in a val[3] array. */
     77   poly8x8_t val[3];
     78 } poly8x8x3_t;
     79 
     80 typedef struct poly8x16x3_t {
     81   poly8x16_t val[3]; /* three poly8x16_t vectors */
     82 } poly8x16x3_t;
     83 
     84 typedef struct poly16x4x3_t {
     85   poly16x4_t val[3]; /* three poly16x4_t vectors */
     86 } poly16x4x3_t;
     87 
     88 typedef struct poly16x8x3_t {
     89   poly16x8_t val[3]; /* three poly16x8_t vectors */
     90 } poly16x8x3_t;
     91 
     92 typedef struct poly64x1x3_t {
     93   poly64x1_t val[3]; /* three poly64x1_t vectors */
     94 } poly64x1x3_t;
     95 
     96 typedef struct poly64x2x3_t {
     97   poly64x2_t val[3]; /* three poly64x2_t vectors */
     98 } poly64x2x3_t;
     99 
    100 typedef struct poly8x8x4_t {
        /* This struct and the five x4 structs that follow each wrap four
         * vectors of a single polynomial vector type in a val[4] array. */
    101   poly8x8_t val[4];
    102 } poly8x8x4_t;
    103 
    104 typedef struct poly8x16x4_t {
    105   poly8x16_t val[4]; /* four poly8x16_t vectors */
    106 } poly8x16x4_t;
    107 
    108 typedef struct poly16x4x4_t {
    109   poly16x4_t val[4]; /* four poly16x4_t vectors */
    110 } poly16x4x4_t;
    111 
    112 typedef struct poly16x8x4_t {
    113   poly16x8_t val[4]; /* four poly16x8_t vectors */
    114 } poly16x8x4_t;
    115 
    116 typedef struct poly64x1x4_t {
    117   poly64x1_t val[4]; /* four poly64x1_t vectors */
    118 } poly64x1x4_t;
    119 
    120 typedef struct poly64x2x4_t {
    121   poly64x2_t val[4]; /* four poly64x2_t vectors */
    122 } poly64x2x4_t;
    123 
    124 #define __ai static __inline__ __attribute__((__always_inline__, __nodebug__))
        /* __ai is the common prefix of every function-style intrinsic in this
         * header: internal linkage, inline, with the always_inline and nodebug
         * attributes applied. */
    125 
    126 #ifdef __LITTLE_ENDIAN__
        /* splatq_lane_bf16(__p0, __p1): passes the bfloat16x4_t __p0 (cast to
         * int8x8_t) and the lane argument __p1 to
         * __builtin_neon_splatq_lane_bf16 and yields the result as a
         * bfloat16x8_t. The trailing 11 is an opaque selector consumed by the
         * builtin (presumably a type code -- confirm).
         * Little-endian build: no lane reordering is performed. */
    127 #define splatq_lane_bf16(__p0, __p1) __extension__ ({ \
    128   bfloat16x8_t __ret; \
    129   bfloat16x4_t __s0 = __p0; \
    130   __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__s0, __p1, 11); \
    131   __ret; \
    132 })
    133 #else
        /* Big-endian build: the four input lanes are reversed before the
         * builtin call and the eight result lanes are reversed afterwards. */
    134 #define splatq_lane_bf16(__p0, __p1) __extension__ ({ \
    135   bfloat16x8_t __ret; \
    136   bfloat16x4_t __s0 = __p0; \
    137   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    138   __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__rev0, __p1, 11); \
    139   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    140   __ret; \
    141 })
        /* Big-endian only: the same builtin call with neither reversal, for
         * wrappers in this header that reverse the lanes themselves. */
    142 #define __noswap_splatq_lane_bf16(__p0, __p1) __extension__ ({ \
    143   bfloat16x8_t __ret; \
    144   bfloat16x4_t __s0 = __p0; \
    145   __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__s0, __p1, 11); \
    146   __ret; \
    147 })
    148 #endif
    149 
    150 #ifdef __LITTLE_ENDIAN__
        /* splat_lane_bf16(__p0, __p1): passes the bfloat16x4_t __p0 (cast to
         * int8x8_t) and the lane argument __p1 to
         * __builtin_neon_splat_lane_bf16 and yields the result as a
         * bfloat16x4_t. The trailing 11 is an opaque selector consumed by the
         * builtin (presumably a type code -- confirm).
         * Little-endian build: no lane reordering is performed. */
    151 #define splat_lane_bf16(__p0, __p1) __extension__ ({ \
    152   bfloat16x4_t __ret; \
    153   bfloat16x4_t __s0 = __p0; \
    154   __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__s0, __p1, 11); \
    155   __ret; \
    156 })
    157 #else
        /* Big-endian build: the four input lanes are reversed before the
         * builtin call and the four result lanes are reversed afterwards. */
    158 #define splat_lane_bf16(__p0, __p1) __extension__ ({ \
    159   bfloat16x4_t __ret; \
    160   bfloat16x4_t __s0 = __p0; \
    161   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    162   __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__rev0, __p1, 11); \
    163   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    164   __ret; \
    165 })
        /* Big-endian only: the same builtin call with neither reversal, for
         * wrappers in this header that reverse the lanes themselves. */
    166 #define __noswap_splat_lane_bf16(__p0, __p1) __extension__ ({ \
    167   bfloat16x4_t __ret; \
    168   bfloat16x4_t __s0 = __p0; \
    169   __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__s0, __p1, 11); \
    170   __ret; \
    171 })
    172 #endif
    173 
    174 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_bf16(__p0, __p1): passes the bfloat16x8_t __p0 (cast to
         * int8x16_t) and the lane argument __p1 to
         * __builtin_neon_splatq_laneq_bf16 and yields the result as a
         * bfloat16x8_t. The trailing 43 is an opaque selector consumed by the
         * builtin (presumably a type code -- confirm).
         * Little-endian build: no lane reordering is performed. */
    175 #define splatq_laneq_bf16(__p0, __p1) __extension__ ({ \
    176   bfloat16x8_t __ret; \
    177   bfloat16x8_t __s0 = __p0; \
    178   __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__s0, __p1, 43); \
    179   __ret; \
    180 })
    181 #else
        /* Big-endian build: the eight input lanes are reversed before the
         * builtin call and the eight result lanes are reversed afterwards. */
    182 #define splatq_laneq_bf16(__p0, __p1) __extension__ ({ \
    183   bfloat16x8_t __ret; \
    184   bfloat16x8_t __s0 = __p0; \
    185   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    186   __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__rev0, __p1, 43); \
    187   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    188   __ret; \
    189 })
        /* Big-endian only: the same builtin call with neither reversal, for
         * wrappers in this header that reverse the lanes themselves. */
    190 #define __noswap_splatq_laneq_bf16(__p0, __p1) __extension__ ({ \
    191   bfloat16x8_t __ret; \
    192   bfloat16x8_t __s0 = __p0; \
    193   __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__s0, __p1, 43); \
    194   __ret; \
    195 })
    196 #endif
    197 
    198 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_bf16(__p0, __p1): passes the bfloat16x8_t __p0 (cast to
         * int8x16_t) and the lane argument __p1 to
         * __builtin_neon_splat_laneq_bf16 and yields the result as a
         * bfloat16x4_t. The trailing 43 is an opaque selector consumed by the
         * builtin (presumably a type code -- confirm).
         * Little-endian build: no lane reordering is performed. */
    199 #define splat_laneq_bf16(__p0, __p1) __extension__ ({ \
    200   bfloat16x4_t __ret; \
    201   bfloat16x8_t __s0 = __p0; \
    202   __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__s0, __p1, 43); \
    203   __ret; \
    204 })
    205 #else
        /* Big-endian build: the eight input lanes are reversed before the
         * builtin call and the four result lanes are reversed afterwards. */
    206 #define splat_laneq_bf16(__p0, __p1) __extension__ ({ \
    207   bfloat16x4_t __ret; \
    208   bfloat16x8_t __s0 = __p0; \
    209   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    210   __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__rev0, __p1, 43); \
    211   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    212   __ret; \
    213 })
        /* Big-endian only: the same builtin call with neither reversal, for
         * wrappers in this header that reverse the lanes themselves. */
    214 #define __noswap_splat_laneq_bf16(__p0, __p1) __extension__ ({ \
    215   bfloat16x4_t __ret; \
    216   bfloat16x8_t __s0 = __p0; \
    217   __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__s0, __p1, 43); \
    218   __ret; \
    219 })
    220 #endif
    221 
    222 #ifdef __LITTLE_ENDIAN__
        /* vbfdotq_f32(__p0, __p1, __p2): forwards the float32x4_t __p0 and the
         * bfloat16x8_t operands __p1 and __p2 (each cast to int8x16_t) to
         * __builtin_neon_vbfdotq_f32 with selector 41 and returns the result as
         * a float32x4_t. Compiled with target("bf16,neon").
         * NOTE(review): the name suggests a BFloat16 dot product accumulated
         * into __p0 -- confirm against the ACLE intrinsic reference.
         * Little-endian build: operands are passed through unchanged. */
    223 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    224   float32x4_t __ret;
    225   __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    226   return __ret;
    227 }
    228 #else
        /* Big-endian build: all three operands have their lanes reversed before
         * the builtin call and the result lanes are reversed afterwards. */
    229 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    230   float32x4_t __ret;
    231   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
    232   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
    233   bfloat16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
    234   __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
    235   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    236   return __ret;
    237 }
        /* Big-endian only: the same builtin call with no lane reversals
         * (presumably for callers that have already reversed the operands). */
    238 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    239   float32x4_t __ret;
    240   __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    241   return __ret;
    242 }
    243 #endif
    244 
    245 #ifdef __LITTLE_ENDIAN__
        /* vbfdot_f32(__p0, __p1, __p2): forwards the float32x2_t __p0 and the
         * bfloat16x4_t operands __p1 and __p2 (each cast to int8x8_t) to
         * __builtin_neon_vbfdot_f32 with selector 9 and returns the result as a
         * float32x2_t. Compiled with target("bf16,neon").
         * NOTE(review): the name suggests a BFloat16 dot product accumulated
         * into __p0 -- confirm against the ACLE intrinsic reference.
         * Little-endian build: operands are passed through unchanged. */
    246 __ai __attribute__((target("bf16,neon"))) float32x2_t vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) {
    247   float32x2_t __ret;
    248   __ret = (float32x2_t) __builtin_neon_vbfdot_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
    249   return __ret;
    250 }
    251 #else
        /* Big-endian build: all three operands have their lanes reversed before
         * the builtin call and the result lanes are reversed afterwards. */
    252 __ai __attribute__((target("bf16,neon"))) float32x2_t vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) {
    253   float32x2_t __ret;
    254   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
    255   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
    256   bfloat16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
    257   __ret = (float32x2_t) __builtin_neon_vbfdot_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
    258   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
    259   return __ret;
    260 }
        /* Big-endian only: the same builtin call with no lane reversals
         * (presumably for callers that have already reversed the operands). */
    261 __ai __attribute__((target("bf16,neon"))) float32x2_t __noswap_vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) {
    262   float32x2_t __ret;
    263   __ret = (float32x2_t) __builtin_neon_vbfdot_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
    264   return __ret;
    265 }
    266 #endif
    267 
    268 #ifdef __LITTLE_ENDIAN__
        /* vbfmlalbq_f32(__p0, __p1, __p2): forwards the float32x4_t __p0 and
         * the bfloat16x8_t operands __p1 and __p2 (each cast to int8x16_t) to
         * __builtin_neon_vbfmlalbq_f32 with selector 41 and returns the result
         * as a float32x4_t. Compiled with target("bf16,neon").
         * NOTE(review): the arithmetic performed is defined by the builtin, not
         * by this wrapper -- see the ACLE intrinsic reference.
         * Little-endian build: operands are passed through unchanged. */
    269 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    270   float32x4_t __ret;
    271   __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    272   return __ret;
    273 }
    274 #else
        /* Big-endian build: all three operands have their lanes reversed before
         * the builtin call and the result lanes are reversed afterwards. */
    275 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    276   float32x4_t __ret;
    277   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
    278   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
    279   bfloat16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
    280   __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
    281   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    282   return __ret;
    283 }
        /* Big-endian only: the same builtin call with no lane reversals
         * (presumably for callers that have already reversed the operands). */
    284 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    285   float32x4_t __ret;
    286   __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    287   return __ret;
    288 }
    289 #endif
    290 
    291 #ifdef __LITTLE_ENDIAN__
        /* vbfmlaltq_f32(__p0, __p1, __p2): forwards the float32x4_t __p0 and
         * the bfloat16x8_t operands __p1 and __p2 (each cast to int8x16_t) to
         * __builtin_neon_vbfmlaltq_f32 with selector 41 and returns the result
         * as a float32x4_t. Compiled with target("bf16,neon").
         * NOTE(review): the arithmetic performed is defined by the builtin, not
         * by this wrapper -- see the ACLE intrinsic reference.
         * Little-endian build: operands are passed through unchanged. */
    292 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    293   float32x4_t __ret;
    294   __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    295   return __ret;
    296 }
    297 #else
        /* Big-endian build: all three operands have their lanes reversed before
         * the builtin call and the result lanes are reversed afterwards. */
    298 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    299   float32x4_t __ret;
    300   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
    301   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
    302   bfloat16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
    303   __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
    304   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    305   return __ret;
    306 }
        /* Big-endian only: the same builtin call with no lane reversals
         * (presumably for callers that have already reversed the operands). */
    307 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    308   float32x4_t __ret;
    309   __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    310   return __ret;
    311 }
    312 #endif
    313 
    314 #ifdef __LITTLE_ENDIAN__
        /* vbfmmlaq_f32(__p0, __p1, __p2): forwards the float32x4_t __p0 and the
         * bfloat16x8_t operands __p1 and __p2 (each cast to int8x16_t) to
         * __builtin_neon_vbfmmlaq_f32 with selector 41 and returns the result
         * as a float32x4_t. Compiled with target("bf16,neon").
         * NOTE(review): the arithmetic performed is defined by the builtin, not
         * by this wrapper -- see the ACLE intrinsic reference.
         * Little-endian build: operands are passed through unchanged. */
    315 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmmlaq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    316   float32x4_t __ret;
    317   __ret = (float32x4_t) __builtin_neon_vbfmmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
    318   return __ret;
    319 }
    320 #else
        /* Big-endian build: all three operands have their lanes reversed before
         * the builtin call and the result lanes are reversed afterwards. No
         * __noswap_ variant is defined for this intrinsic. */
    321 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmmlaq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) {
    322   float32x4_t __ret;
    323   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
    324   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
    325   bfloat16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
    326   __ret = (float32x4_t) __builtin_neon_vbfmmlaq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
    327   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    328   return __ret;
    329 }
    330 #endif
    331 
    332 #ifdef __LITTLE_ENDIAN__
        /* vcombine_bf16(__p0, __p1): concatenates two bfloat16x4_t vectors into
         * one bfloat16x8_t. The shuffle indices 0..7 select the four lanes of
         * __p0 followed by the four lanes of __p1.
         * Little-endian build: a single shuffle, no lane reordering. */
    333 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) {
    334   bfloat16x8_t __ret;
    335   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
    336   return __ret;
    337 }
    338 #else
        /* Big-endian build: both inputs are lane-reversed, concatenated, and
         * the eight-lane result is reversed again. */
    339 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) {
    340   bfloat16x8_t __ret;
    341   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
    342   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
    343   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7);
    344   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
    345   return __ret;
    346 }
        /* Big-endian only: plain concatenation with no lane reversals
         * (presumably for callers that have already reversed the operands). */
    347 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t __noswap_vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) {
    348   bfloat16x8_t __ret;
    349   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
    350   return __ret;
    351 }
    352 #endif
    353 
    354 #define vcreate_bf16(__p0) __extension__ ({ \
    355   bfloat16x4_t __ret; \
    356   uint64_t __promote = __p0; \
    357   __ret = (bfloat16x4_t)(__promote); \
    358   __ret; \
    359 }) /* vcreate_bf16(__p0): converts __p0 to uint64_t once (so the argument
         * expression is evaluated a single time) and casts that 64-bit value to
         * a bfloat16x4_t, which is the value of the statement expression. The
         * same definition is used for both endiannesses. */
    360 __ai __attribute__((target("bf16,neon"))) float32_t vcvtah_f32_bf16(bfloat16_t __p0) {
        /* Widens one bfloat16_t to float32_t purely by bit manipulation: the
         * 16 bits of __p0 are read as a uint16_t, widened to uint32_t, shifted
         * left by 16, and the resulting 32-bit pattern is bit-cast to
         * float32_t. The low 16 bits of the result are therefore zero. */
    361   float32_t __ret;
    362   __ret = __builtin_bit_cast(float32_t, (uint32_t)(__builtin_bit_cast(uint16_t, __p0)) << 16);
    363   return __ret;
    364 }
    365 __ai __attribute__((target("bf16,neon"))) bfloat16_t vcvth_bf16_f32(float32_t __p0) {
        /* Converts one float32_t to bfloat16_t by delegating to
         * __builtin_neon_vcvth_bf16_f32 and casting its result.
         * NOTE(review): the rounding behaviour is determined by the builtin and
         * is not visible here -- confirm against the ACLE reference. */
    366   bfloat16_t __ret;
    367   __ret = (bfloat16_t) __builtin_neon_vcvth_bf16_f32(__p0);
    368   return __ret;
    369 }
    370 #ifdef __LITTLE_ENDIAN__
        /* vduph_lane_bf16(__p0, __p1): passes the bfloat16x4_t __p0 and the
         * lane argument __p1 to __builtin_neon_vduph_lane_bf16 and yields a
         * scalar bfloat16_t (presumably the element at lane __p1 -- confirm).
         * Little-endian build: the vector is passed through unchanged. */
    371 #define vduph_lane_bf16(__p0, __p1) __extension__ ({ \
    372   bfloat16_t __ret; \
    373   bfloat16x4_t __s0 = __p0; \
    374   __ret = (bfloat16_t) __builtin_neon_vduph_lane_bf16((bfloat16x4_t)__s0, __p1); \
    375   __ret; \
    376 })
    377 #else
        /* Big-endian build: the input lanes are reversed before the builtin
         * call; the scalar result is returned as is. */
    378 #define vduph_lane_bf16(__p0, __p1) __extension__ ({ \
    379   bfloat16_t __ret; \
    380   bfloat16x4_t __s0 = __p0; \
    381   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    382   __ret = (bfloat16_t) __builtin_neon_vduph_lane_bf16((bfloat16x4_t)__rev0, __p1); \
    383   __ret; \
    384 })
    385 #endif
    386 
    387 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_bf16(v, lane): takes a bfloat16x4_t and a lane argument
         * and yields a bfloat16x8_t by delegating to splatq_lane_bf16. The
         * numeric suffix on the locals (_0 here) keeps them distinct from the
         * __s0/__ret locals declared inside the nested macro expansion. */
    388 #define vdupq_lane_bf16(__p0_0, __p1_0) __extension__ ({ \
    389   bfloat16x8_t __ret_0; \
    390   bfloat16x4_t __s0_0 = __p0_0; \
    391   __ret_0 = splatq_lane_bf16(__s0_0, __p1_0); \
    392   __ret_0; \
    393 })
    394 #else
        /* Big-endian build: reverses the input lanes here, calls the
         * __noswap_ helper (which does no reversal of its own), then reverses
         * the eight result lanes. */
    395 #define vdupq_lane_bf16(__p0_1, __p1_1) __extension__ ({ \
    396   bfloat16x8_t __ret_1; \
    397   bfloat16x4_t __s0_1 = __p0_1; \
    398   bfloat16x4_t __rev0_1;  __rev0_1 = __builtin_shufflevector(__s0_1, __s0_1, 3, 2, 1, 0); \
    399   __ret_1 = __noswap_splatq_lane_bf16(__rev0_1, __p1_1); \
    400   __ret_1 = __builtin_shufflevector(__ret_1, __ret_1, 7, 6, 5, 4, 3, 2, 1, 0); \
    401   __ret_1; \
    402 })
    403 #endif
    404 
    405 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_bf16(v, lane): takes a bfloat16x4_t and a lane argument and
         * yields a bfloat16x4_t by delegating to splat_lane_bf16. The numeric
         * suffix on the locals (_2 here) keeps them distinct from the
         * __s0/__ret locals declared inside the nested macro expansion. */
    406 #define vdup_lane_bf16(__p0_2, __p1_2) __extension__ ({ \
    407   bfloat16x4_t __ret_2; \
    408   bfloat16x4_t __s0_2 = __p0_2; \
    409   __ret_2 = splat_lane_bf16(__s0_2, __p1_2); \
    410   __ret_2; \
    411 })
    412 #else
        /* Big-endian build: reverses the input lanes here, calls the
         * __noswap_ helper (which does no reversal of its own), then reverses
         * the four result lanes. */
    413 #define vdup_lane_bf16(__p0_3, __p1_3) __extension__ ({ \
    414   bfloat16x4_t __ret_3; \
    415   bfloat16x4_t __s0_3 = __p0_3; \
    416   bfloat16x4_t __rev0_3;  __rev0_3 = __builtin_shufflevector(__s0_3, __s0_3, 3, 2, 1, 0); \
    417   __ret_3 = __noswap_splat_lane_bf16(__rev0_3, __p1_3); \
    418   __ret_3 = __builtin_shufflevector(__ret_3, __ret_3, 3, 2, 1, 0); \
    419   __ret_3; \
    420 })
    421 #endif
    422 
    423 #ifdef __LITTLE_ENDIAN__
        /* vduph_laneq_bf16(__p0, __p1): passes the bfloat16x8_t __p0 and the
         * lane argument __p1 to __builtin_neon_vduph_laneq_bf16 and yields a
         * scalar bfloat16_t (presumably the element at lane __p1 -- confirm).
         * Little-endian build: the vector is passed through unchanged. */
    424 #define vduph_laneq_bf16(__p0, __p1) __extension__ ({ \
    425   bfloat16_t __ret; \
    426   bfloat16x8_t __s0 = __p0; \
    427   __ret = (bfloat16_t) __builtin_neon_vduph_laneq_bf16((bfloat16x8_t)__s0, __p1); \
    428   __ret; \
    429 })
    430 #else
        /* Big-endian build: the input lanes are reversed before the builtin
         * call; the scalar result is returned as is. */
    431 #define vduph_laneq_bf16(__p0, __p1) __extension__ ({ \
    432   bfloat16_t __ret; \
    433   bfloat16x8_t __s0 = __p0; \
    434   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    435   __ret = (bfloat16_t) __builtin_neon_vduph_laneq_bf16((bfloat16x8_t)__rev0, __p1); \
    436   __ret; \
    437 })
    438 #endif
    439 
    440 #ifdef __LITTLE_ENDIAN__
        /* vdupq_laneq_bf16(v, lane): takes a bfloat16x8_t and a lane argument
         * and yields a bfloat16x8_t by delegating to splatq_laneq_bf16. The
         * numeric suffix on the locals (_4 here) keeps them distinct from the
         * __s0/__ret locals declared inside the nested macro expansion. */
    441 #define vdupq_laneq_bf16(__p0_4, __p1_4) __extension__ ({ \
    442   bfloat16x8_t __ret_4; \
    443   bfloat16x8_t __s0_4 = __p0_4; \
    444   __ret_4 = splatq_laneq_bf16(__s0_4, __p1_4); \
    445   __ret_4; \
    446 })
    447 #else
        /* Big-endian build: reverses the input lanes here, calls the
         * __noswap_ helper (which does no reversal of its own), then reverses
         * the eight result lanes. */
    448 #define vdupq_laneq_bf16(__p0_5, __p1_5) __extension__ ({ \
    449   bfloat16x8_t __ret_5; \
    450   bfloat16x8_t __s0_5 = __p0_5; \
    451   bfloat16x8_t __rev0_5;  __rev0_5 = __builtin_shufflevector(__s0_5, __s0_5, 7, 6, 5, 4, 3, 2, 1, 0); \
    452   __ret_5 = __noswap_splatq_laneq_bf16(__rev0_5, __p1_5); \
    453   __ret_5 = __builtin_shufflevector(__ret_5, __ret_5, 7, 6, 5, 4, 3, 2, 1, 0); \
    454   __ret_5; \
    455 })
    456 #endif
    457 
    458 #ifdef __LITTLE_ENDIAN__
        /* vdup_laneq_bf16(v, lane): takes a bfloat16x8_t and a lane argument
         * and yields a bfloat16x4_t by delegating to splat_laneq_bf16. The
         * numeric suffix on the locals (_6 here) keeps them distinct from the
         * __s0/__ret locals declared inside the nested macro expansion. */
    459 #define vdup_laneq_bf16(__p0_6, __p1_6) __extension__ ({ \
    460   bfloat16x4_t __ret_6; \
    461   bfloat16x8_t __s0_6 = __p0_6; \
    462   __ret_6 = splat_laneq_bf16(__s0_6, __p1_6); \
    463   __ret_6; \
    464 })
    465 #else
        /* Big-endian build: reverses the eight input lanes here, calls the
         * __noswap_ helper (which does no reversal of its own), then reverses
         * the four result lanes. */
    466 #define vdup_laneq_bf16(__p0_7, __p1_7) __extension__ ({ \
    467   bfloat16x4_t __ret_7; \
    468   bfloat16x8_t __s0_7 = __p0_7; \
    469   bfloat16x8_t __rev0_7;  __rev0_7 = __builtin_shufflevector(__s0_7, __s0_7, 7, 6, 5, 4, 3, 2, 1, 0); \
    470   __ret_7 = __noswap_splat_laneq_bf16(__rev0_7, __p1_7); \
    471   __ret_7 = __builtin_shufflevector(__ret_7, __ret_7, 3, 2, 1, 0); \
    472   __ret_7; \
    473 })
    474 #endif
    475 
    476 #ifdef __LITTLE_ENDIAN__
        /* vdupq_n_bf16(__p0): returns a bfloat16x8_t whose eight lanes are all
         * initialised to the scalar __p0. */
    477 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vdupq_n_bf16(bfloat16_t __p0) {
    478   bfloat16x8_t __ret;
    479   __ret = (bfloat16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
    480   return __ret;
    481 }
    482 #else
        /* Big-endian build: same initialiser followed by a lane reversal. As
         * every lane holds the same value, the reversal leaves the vector's
         * contents unchanged. */
    483 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vdupq_n_bf16(bfloat16_t __p0) {
    484   bfloat16x8_t __ret;
    485   __ret = (bfloat16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
    486   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
    487   return __ret;
    488 }
    489 #endif
    490 
    491 #ifdef __LITTLE_ENDIAN__
        /* vdup_n_bf16(__p0): returns a bfloat16x4_t whose four lanes are all
         * initialised to the scalar __p0. */
    492 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vdup_n_bf16(bfloat16_t __p0) {
    493   bfloat16x4_t __ret;
    494   __ret = (bfloat16x4_t) {__p0, __p0, __p0, __p0};
    495   return __ret;
    496 }
    497 #else
        /* Big-endian build: same initialiser followed by a lane reversal. As
         * every lane holds the same value, the reversal leaves the vector's
         * contents unchanged. */
    498 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vdup_n_bf16(bfloat16_t __p0) {
    499   bfloat16x4_t __ret;
    500   __ret = (bfloat16x4_t) {__p0, __p0, __p0, __p0};
    501   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    502   return __ret;
    503 }
    504 #endif
    505 
    506 #ifdef __LITTLE_ENDIAN__
        /* vget_high_bf16(__p0): returns lanes 4..7 of the bfloat16x8_t __p0 as
         * a bfloat16x4_t.
         * Little-endian build: a single shuffle, no lane reordering. */
    507 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_high_bf16(bfloat16x8_t __p0) {
    508   bfloat16x4_t __ret;
    509   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
    510   return __ret;
    511 }
    512 #else
        /* Big-endian build: the input is lane-reversed, lanes 4..7 of the
         * reversed vector are selected, and the four-lane result is reversed
         * again. */
    513 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_high_bf16(bfloat16x8_t __p0) {
    514   bfloat16x4_t __ret;
    515   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
    516   __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7);
    517   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    518   return __ret;
    519 }
        /* Big-endian only: the plain lanes-4..7 selection with no reversals
         * (presumably for callers that have already reversed the operand). */
    520 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap_vget_high_bf16(bfloat16x8_t __p0) {
    521   bfloat16x4_t __ret;
    522   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
    523   return __ret;
    524 }
    525 #endif
    526 
    527 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_bf16(__p0, __p1): passes the bfloat16x8_t __p0 and the
         * lane argument __p1 to __builtin_neon_vgetq_lane_bf16 and yields a
         * scalar bfloat16_t (presumably the element at lane __p1 -- confirm).
         * Little-endian build: the vector is passed through unchanged. */
    528 #define vgetq_lane_bf16(__p0, __p1) __extension__ ({ \
    529   bfloat16_t __ret; \
    530   bfloat16x8_t __s0 = __p0; \
    531   __ret = (bfloat16_t) __builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__s0, __p1); \
    532   __ret; \
    533 })
    534 #else
        /* Big-endian build: the input lanes are reversed before the builtin
         * call; the scalar result is returned as is. */
    535 #define vgetq_lane_bf16(__p0, __p1) __extension__ ({ \
    536   bfloat16_t __ret; \
    537   bfloat16x8_t __s0 = __p0; \
    538   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    539   __ret = (bfloat16_t) __builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__rev0, __p1); \
    540   __ret; \
    541 })
        /* Big-endian only: the same builtin call without the input reversal
         * (presumably for callers that have already reversed the operand). */
    542 #define __noswap_vgetq_lane_bf16(__p0, __p1) __extension__ ({ \
    543   bfloat16_t __ret; \
    544   bfloat16x8_t __s0 = __p0; \
    545   __ret = (bfloat16_t) __builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__s0, __p1); \
    546   __ret; \
    547 })
    548 #endif
    549 
    550 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_bf16(__p0, __p1): passes the bfloat16x4_t __p0 and the lane
         * argument __p1 to __builtin_neon_vget_lane_bf16 and yields a scalar
         * bfloat16_t (presumably the element at lane __p1 -- confirm).
         * Little-endian build: the vector is passed through unchanged. */
    551 #define vget_lane_bf16(__p0, __p1) __extension__ ({ \
    552   bfloat16_t __ret; \
    553   bfloat16x4_t __s0 = __p0; \
    554   __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__s0, __p1); \
    555   __ret; \
    556 })
    557 #else
        /* Big-endian build: the input lanes are reversed before the builtin
         * call; the scalar result is returned as is. */
    558 #define vget_lane_bf16(__p0, __p1) __extension__ ({ \
    559   bfloat16_t __ret; \
    560   bfloat16x4_t __s0 = __p0; \
    561   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    562   __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__rev0, __p1); \
    563   __ret; \
    564 })
        /* Big-endian only: the same builtin call without the input reversal
         * (presumably for callers that have already reversed the operand). */
    565 #define __noswap_vget_lane_bf16(__p0, __p1) __extension__ ({ \
    566   bfloat16_t __ret; \
    567   bfloat16x4_t __s0 = __p0; \
    568   __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__s0, __p1); \
    569   __ret; \
    570 })
    571 #endif
    572 
    573 #ifdef __LITTLE_ENDIAN__
        /* vget_low_bf16(__p0): returns lanes 0..3 of the bfloat16x8_t __p0 as a
         * bfloat16x4_t.
         * Little-endian build: a single shuffle, no lane reordering. */
    574 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_low_bf16(bfloat16x8_t __p0) {
    575   bfloat16x4_t __ret;
    576   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
    577   return __ret;
    578 }
    579 #else
        /* Big-endian build: the input is lane-reversed, lanes 0..3 of the
         * reversed vector are selected, and the four-lane result is reversed
         * again. */
    580 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_low_bf16(bfloat16x8_t __p0) {
    581   bfloat16x4_t __ret;
    582   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
    583   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3);
    584   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
    585   return __ret;
    586 }
        /* Big-endian only: the plain lanes-0..3 selection with no reversals
         * (presumably for callers that have already reversed the operand). */
    587 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap_vget_low_bf16(bfloat16x8_t __p0) {
    588   bfloat16x4_t __ret;
    589   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
    590   return __ret;
    591 }
    592 #endif
    593 
    594 #ifdef __LITTLE_ENDIAN__
        /* vld1q_bf16(__p0): passes __p0 to __builtin_neon_vld1q_bf16 with
         * selector 43 and yields the result as a bfloat16x8_t.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the result is returned as produced. */
    595 #define vld1q_bf16(__p0) __extension__ ({ \
    596   bfloat16x8_t __ret; \
    597   __ret = (bfloat16x8_t) __builtin_neon_vld1q_bf16(__p0, 43); \
    598   __ret; \
    599 })
    600 #else
        /* Big-endian build: the eight result lanes are reversed after the
         * builtin returns. */
    601 #define vld1q_bf16(__p0) __extension__ ({ \
    602   bfloat16x8_t __ret; \
    603   __ret = (bfloat16x8_t) __builtin_neon_vld1q_bf16(__p0, 43); \
    604   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    605   __ret; \
    606 })
    607 #endif
    608 
    609 #ifdef __LITTLE_ENDIAN__
        /* vld1_bf16(__p0): passes __p0 to __builtin_neon_vld1_bf16 with
         * selector 11 and yields the result as a bfloat16x4_t.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the result is returned as produced. */
    610 #define vld1_bf16(__p0) __extension__ ({ \
    611   bfloat16x4_t __ret; \
    612   __ret = (bfloat16x4_t) __builtin_neon_vld1_bf16(__p0, 11); \
    613   __ret; \
    614 })
    615 #else
        /* Big-endian build: the four result lanes are reversed after the
         * builtin returns. */
    616 #define vld1_bf16(__p0) __extension__ ({ \
    617   bfloat16x4_t __ret; \
    618   __ret = (bfloat16x4_t) __builtin_neon_vld1_bf16(__p0, 11); \
    619   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    620   __ret; \
    621 })
    622 #endif
    623 
    624 #ifdef __LITTLE_ENDIAN__
        /* vld1q_dup_bf16(__p0): passes __p0 to __builtin_neon_vld1q_dup_bf16
         * with selector 43 and yields the result as a bfloat16x8_t.
         * NOTE(review): presumably loads one element from address __p0 and
         * replicates it to every lane -- confirm against the ACLE reference.
         * Little-endian build: the result is returned as produced. */
    625 #define vld1q_dup_bf16(__p0) __extension__ ({ \
    626   bfloat16x8_t __ret; \
    627   __ret = (bfloat16x8_t) __builtin_neon_vld1q_dup_bf16(__p0, 43); \
    628   __ret; \
    629 })
    630 #else
        /* Big-endian build: the eight result lanes are reversed after the
         * builtin returns. */
    631 #define vld1q_dup_bf16(__p0) __extension__ ({ \
    632   bfloat16x8_t __ret; \
    633   __ret = (bfloat16x8_t) __builtin_neon_vld1q_dup_bf16(__p0, 43); \
    634   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    635   __ret; \
    636 })
    637 #endif
    638 
    639 #ifdef __LITTLE_ENDIAN__
        /* vld1_dup_bf16(__p0): passes __p0 to __builtin_neon_vld1_dup_bf16 with
         * selector 11 and yields the result as a bfloat16x4_t.
         * NOTE(review): presumably loads one element from address __p0 and
         * replicates it to every lane -- confirm against the ACLE reference.
         * Little-endian build: the result is returned as produced. */
    640 #define vld1_dup_bf16(__p0) __extension__ ({ \
    641   bfloat16x4_t __ret; \
    642   __ret = (bfloat16x4_t) __builtin_neon_vld1_dup_bf16(__p0, 11); \
    643   __ret; \
    644 })
    645 #else
        /* Big-endian build: the four result lanes are reversed after the
         * builtin returns. */
    646 #define vld1_dup_bf16(__p0) __extension__ ({ \
    647   bfloat16x4_t __ret; \
    648   __ret = (bfloat16x4_t) __builtin_neon_vld1_dup_bf16(__p0, 11); \
    649   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    650   __ret; \
    651 })
    652 #endif
    653 
    654 #ifdef __LITTLE_ENDIAN__
        /* vld1q_lane_bf16(__p0, __p1, __p2): passes __p0, the bfloat16x8_t __p1
         * (cast to int8x16_t) and the lane argument __p2 to
         * __builtin_neon_vld1q_lane_bf16 with selector 43 and yields the result
         * as a bfloat16x8_t.
         * NOTE(review): presumably loads one element from address __p0 into
         * lane __p2 of a copy of __p1 -- confirm against the ACLE reference.
         * Little-endian build: no lane reordering is performed. */
    655 #define vld1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    656   bfloat16x8_t __ret; \
    657   bfloat16x8_t __s1 = __p1; \
    658   __ret = (bfloat16x8_t) __builtin_neon_vld1q_lane_bf16(__p0, (int8x16_t)__s1, __p2, 43); \
    659   __ret; \
    660 })
    661 #else
        /* Big-endian build: the lanes of __p1 are reversed before the builtin
         * call and the result lanes are reversed afterwards. */
    662 #define vld1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    663   bfloat16x8_t __ret; \
    664   bfloat16x8_t __s1 = __p1; \
    665   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    666   __ret = (bfloat16x8_t) __builtin_neon_vld1q_lane_bf16(__p0, (int8x16_t)__rev1, __p2, 43); \
    667   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    668   __ret; \
    669 })
    670 #endif
    671 
    672 #ifdef __LITTLE_ENDIAN__
        /* vld1_lane_bf16(__p0, __p1, __p2): passes __p0, the bfloat16x4_t __p1
         * (cast to int8x8_t) and the lane argument __p2 to
         * __builtin_neon_vld1_lane_bf16 with selector 11 and yields the result
         * as a bfloat16x4_t.
         * NOTE(review): presumably loads one element from address __p0 into
         * lane __p2 of a copy of __p1 -- confirm against the ACLE reference.
         * Little-endian build: no lane reordering is performed. */
    673 #define vld1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    674   bfloat16x4_t __ret; \
    675   bfloat16x4_t __s1 = __p1; \
    676   __ret = (bfloat16x4_t) __builtin_neon_vld1_lane_bf16(__p0, (int8x8_t)__s1, __p2, 11); \
    677   __ret; \
    678 })
    679 #else
        /* Big-endian build: the lanes of __p1 are reversed before the builtin
         * call and the result lanes are reversed afterwards. */
    680 #define vld1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    681   bfloat16x4_t __ret; \
    682   bfloat16x4_t __s1 = __p1; \
    683   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    684   __ret = (bfloat16x4_t) __builtin_neon_vld1_lane_bf16(__p0, (int8x8_t)__rev1, __p2, 11); \
    685   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    686   __ret; \
    687 })
    688 #endif
    689 
    690 #ifdef __LITTLE_ENDIAN__
        /* vld1q_bf16_x2(__p0): declares a bfloat16x8x2_t, hands its address
         * together with __p0 and selector 43 to __builtin_neon_vld1q_bf16_x2,
         * which fills it in, and yields the struct.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the struct is returned as filled. */
    691 #define vld1q_bf16_x2(__p0) __extension__ ({ \
    692   bfloat16x8x2_t __ret; \
    693   __builtin_neon_vld1q_bf16_x2(&__ret, __p0, 43); \
    694   __ret; \
    695 })
    696 #else
        /* Big-endian build: after the builtin fills the struct, the lanes of
         * val[0] and val[1] are each reversed. */
    697 #define vld1q_bf16_x2(__p0) __extension__ ({ \
    698   bfloat16x8x2_t __ret; \
    699   __builtin_neon_vld1q_bf16_x2(&__ret, __p0, 43); \
    700  \
    701   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    702   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    703   __ret; \
    704 })
    705 #endif
    706 
    707 #ifdef __LITTLE_ENDIAN__
        /* vld1_bf16_x2(__p0): declares a bfloat16x4x2_t, hands its address
         * together with __p0 and selector 11 to __builtin_neon_vld1_bf16_x2,
         * which fills it in, and yields the struct.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the struct is returned as filled. */
    708 #define vld1_bf16_x2(__p0) __extension__ ({ \
    709   bfloat16x4x2_t __ret; \
    710   __builtin_neon_vld1_bf16_x2(&__ret, __p0, 11); \
    711   __ret; \
    712 })
    713 #else
        /* Big-endian build: after the builtin fills the struct, the lanes of
         * val[0] and val[1] are each reversed. */
    714 #define vld1_bf16_x2(__p0) __extension__ ({ \
    715   bfloat16x4x2_t __ret; \
    716   __builtin_neon_vld1_bf16_x2(&__ret, __p0, 11); \
    717  \
    718   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    719   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    720   __ret; \
    721 })
    722 #endif
    723 
    724 #ifdef __LITTLE_ENDIAN__
        /* vld1q_bf16_x3(__p0): declares a bfloat16x8x3_t, hands its address
         * together with __p0 and selector 43 to __builtin_neon_vld1q_bf16_x3,
         * which fills it in, and yields the struct.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the struct is returned as filled. */
    725 #define vld1q_bf16_x3(__p0) __extension__ ({ \
    726   bfloat16x8x3_t __ret; \
    727   __builtin_neon_vld1q_bf16_x3(&__ret, __p0, 43); \
    728   __ret; \
    729 })
    730 #else
        /* Big-endian build: after the builtin fills the struct, the lanes of
         * val[0], val[1] and val[2] are each reversed. */
    731 #define vld1q_bf16_x3(__p0) __extension__ ({ \
    732   bfloat16x8x3_t __ret; \
    733   __builtin_neon_vld1q_bf16_x3(&__ret, __p0, 43); \
    734  \
    735   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    736   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    737   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    738   __ret; \
    739 })
    740 #endif
    741 
    742 #ifdef __LITTLE_ENDIAN__
        /* vld1_bf16_x3(__p0): declares a bfloat16x4x3_t, hands its address
         * together with __p0 and selector 11 to __builtin_neon_vld1_bf16_x3,
         * which fills it in, and yields the struct.
         * NOTE(review): __p0 is presumably the address of the bfloat16 data to
         * load -- confirm against the ACLE reference.
         * Little-endian build: the struct is returned as filled. */
    743 #define vld1_bf16_x3(__p0) __extension__ ({ \
    744   bfloat16x4x3_t __ret; \
    745   __builtin_neon_vld1_bf16_x3(&__ret, __p0, 11); \
    746   __ret; \
    747 })
    748 #else
        /* Big-endian build: after the builtin fills the struct, the lanes of
         * val[0], val[1] and val[2] are each reversed. */
    749 #define vld1_bf16_x3(__p0) __extension__ ({ \
    750   bfloat16x4x3_t __ret; \
    751   __builtin_neon_vld1_bf16_x3(&__ret, __p0, 11); \
    752  \
    753   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    754   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    755   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
    756   __ret; \
    757 })
    758 #endif
    759 
     760 #ifdef __LITTLE_ENDIAN__
         /* vld1q_bf16_x4(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 43 to __builtin_neon_vld1q_bf16_x4 and yields the
          * bfloat16x8x4_t it filled in. */
     761 #define vld1q_bf16_x4(__p0) __extension__ ({ \
     762   bfloat16x8x4_t __ret; \
     763   __builtin_neon_vld1q_bf16_x4(&__ret, __p0, 43); \
     764   __ret; \
     765 })
     766 #else
         /* vld1q_bf16_x4(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..3] has its 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     767 #define vld1q_bf16_x4(__p0) __extension__ ({ \
     768   bfloat16x8x4_t __ret; \
     769   __builtin_neon_vld1q_bf16_x4(&__ret, __p0, 43); \
     770  \
     771   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     772   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     773   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
     774   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
     775   __ret; \
     776 })
     777 #endif
    778 
     779 #ifdef __LITTLE_ENDIAN__
         /* vld1_bf16_x4(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 11 to __builtin_neon_vld1_bf16_x4 and yields the
          * bfloat16x4x4_t it filled in. */
     780 #define vld1_bf16_x4(__p0) __extension__ ({ \
     781   bfloat16x4x4_t __ret; \
     782   __builtin_neon_vld1_bf16_x4(&__ret, __p0, 11); \
     783   __ret; \
     784 })
     785 #else
         /* vld1_bf16_x4(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..3] has its 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     786 #define vld1_bf16_x4(__p0) __extension__ ({ \
     787   bfloat16x4x4_t __ret; \
     788   __builtin_neon_vld1_bf16_x4(&__ret, __p0, 11); \
     789  \
     790   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     791   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     792   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
     793   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
     794   __ret; \
     795 })
     796 #endif
    797 
     798 #ifdef __LITTLE_ENDIAN__
         /* vld2q_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 43 to __builtin_neon_vld2q_bf16 and yields the
          * bfloat16x8x2_t it filled in. */
     799 #define vld2q_bf16(__p0) __extension__ ({ \
     800   bfloat16x8x2_t __ret; \
     801   __builtin_neon_vld2q_bf16(&__ret, __p0, 43); \
     802   __ret; \
     803 })
     804 #else
         /* vld2q_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then val[0] and val[1] each have their 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     805 #define vld2q_bf16(__p0) __extension__ ({ \
     806   bfloat16x8x2_t __ret; \
     807   __builtin_neon_vld2q_bf16(&__ret, __p0, 43); \
     808  \
     809   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     810   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     811   __ret; \
     812 })
     813 #endif
    814 
     815 #ifdef __LITTLE_ENDIAN__
         /* vld2_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 11 to __builtin_neon_vld2_bf16 and yields the
          * bfloat16x4x2_t it filled in. */
     816 #define vld2_bf16(__p0) __extension__ ({ \
     817   bfloat16x4x2_t __ret; \
     818   __builtin_neon_vld2_bf16(&__ret, __p0, 11); \
     819   __ret; \
     820 })
     821 #else
         /* vld2_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then val[0] and val[1] each have their 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     822 #define vld2_bf16(__p0) __extension__ ({ \
     823   bfloat16x4x2_t __ret; \
     824   __builtin_neon_vld2_bf16(&__ret, __p0, 11); \
     825  \
     826   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     827   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     828   __ret; \
     829 })
     830 #endif
    831 
     832 #ifdef __LITTLE_ENDIAN__
         /* vld2q_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 43 to __builtin_neon_vld2q_dup_bf16 and yields the
          * bfloat16x8x2_t it filled in. */
     833 #define vld2q_dup_bf16(__p0) __extension__ ({ \
     834   bfloat16x8x2_t __ret; \
     835   __builtin_neon_vld2q_dup_bf16(&__ret, __p0, 43); \
     836   __ret; \
     837 })
     838 #else
         /* vld2q_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then val[0] and val[1] each have their 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     839 #define vld2q_dup_bf16(__p0) __extension__ ({ \
     840   bfloat16x8x2_t __ret; \
     841   __builtin_neon_vld2q_dup_bf16(&__ret, __p0, 43); \
     842  \
     843   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     844   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     845   __ret; \
     846 })
     847 #endif
    848 
     849 #ifdef __LITTLE_ENDIAN__
         /* vld2_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 11 to __builtin_neon_vld2_dup_bf16 and yields the
          * bfloat16x4x2_t it filled in. */
     850 #define vld2_dup_bf16(__p0) __extension__ ({ \
     851   bfloat16x4x2_t __ret; \
     852   __builtin_neon_vld2_dup_bf16(&__ret, __p0, 11); \
     853   __ret; \
     854 })
     855 #else
         /* vld2_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then val[0] and val[1] each have their 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     856 #define vld2_dup_bf16(__p0) __extension__ ({ \
     857   bfloat16x4x2_t __ret; \
     858   __builtin_neon_vld2_dup_bf16(&__ret, __p0, 11); \
     859  \
     860   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     861   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     862   __ret; \
     863 })
     864 #endif
    865 
     866 #ifdef __LITTLE_ENDIAN__
         /* vld2q_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its two vectors (cast to int8x16_t) together
          * with __p0, __p2 and the constant 43 to __builtin_neon_vld2q_lane_bf16;
          * yields the bfloat16x8x2_t written through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
     867 #define vld2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     868   bfloat16x8x2_t __ret; \
     869   bfloat16x8x2_t __s1 = __p1; \
     870   __builtin_neon_vld2q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 43); \
     871   __ret; \
     872 })
     873 #else
         /* vld2q_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
     874 #define vld2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     875   bfloat16x8x2_t __ret; \
     876   bfloat16x8x2_t __s1 = __p1; \
     877   bfloat16x8x2_t __rev1; \
     878   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     879   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     880   __builtin_neon_vld2q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 43); \
     881  \
     882   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     883   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     884   __ret; \
     885 })
     886 #endif
    887 
     888 #ifdef __LITTLE_ENDIAN__
         /* vld2_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its two vectors (cast to int8x8_t) together
          * with __p0, __p2 and the constant 11 to __builtin_neon_vld2_lane_bf16;
          * yields the bfloat16x4x2_t written through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
     889 #define vld2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     890   bfloat16x4x2_t __ret; \
     891   bfloat16x4x2_t __s1 = __p1; \
     892   __builtin_neon_vld2_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 11); \
     893   __ret; \
     894 })
     895 #else
         /* vld2_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
     896 #define vld2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     897   bfloat16x4x2_t __ret; \
     898   bfloat16x4x2_t __s1 = __p1; \
     899   bfloat16x4x2_t __rev1; \
     900   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
     901   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
     902   __builtin_neon_vld2_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 11); \
     903  \
     904   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     905   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     906   __ret; \
     907 })
     908 #endif
    909 
     910 #ifdef __LITTLE_ENDIAN__
         /* vld3q_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 43 to __builtin_neon_vld3q_bf16 and yields the
          * bfloat16x8x3_t it filled in. */
     911 #define vld3q_bf16(__p0) __extension__ ({ \
     912   bfloat16x8x3_t __ret; \
     913   __builtin_neon_vld3q_bf16(&__ret, __p0, 43); \
     914   __ret; \
     915 })
     916 #else
         /* vld3q_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..2] has its 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     917 #define vld3q_bf16(__p0) __extension__ ({ \
     918   bfloat16x8x3_t __ret; \
     919   __builtin_neon_vld3q_bf16(&__ret, __p0, 43); \
     920  \
     921   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     922   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     923   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
     924   __ret; \
     925 })
     926 #endif
    927 
     928 #ifdef __LITTLE_ENDIAN__
         /* vld3_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 11 to __builtin_neon_vld3_bf16 and yields the
          * bfloat16x4x3_t it filled in. */
     929 #define vld3_bf16(__p0) __extension__ ({ \
     930   bfloat16x4x3_t __ret; \
     931   __builtin_neon_vld3_bf16(&__ret, __p0, 11); \
     932   __ret; \
     933 })
     934 #else
         /* vld3_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..2] has its 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     935 #define vld3_bf16(__p0) __extension__ ({ \
     936   bfloat16x4x3_t __ret; \
     937   __builtin_neon_vld3_bf16(&__ret, __p0, 11); \
     938  \
     939   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     940   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     941   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
     942   __ret; \
     943 })
     944 #endif
    945 
     946 #ifdef __LITTLE_ENDIAN__
         /* vld3q_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 43 to __builtin_neon_vld3q_dup_bf16 and yields the
          * bfloat16x8x3_t it filled in. */
     947 #define vld3q_dup_bf16(__p0) __extension__ ({ \
     948   bfloat16x8x3_t __ret; \
     949   __builtin_neon_vld3q_dup_bf16(&__ret, __p0, 43); \
     950   __ret; \
     951 })
     952 #else
         /* vld3q_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then each of val[0..2] has its 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     953 #define vld3q_dup_bf16(__p0) __extension__ ({ \
     954   bfloat16x8x3_t __ret; \
     955   __builtin_neon_vld3q_dup_bf16(&__ret, __p0, 43); \
     956  \
     957   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     958   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     959   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
     960   __ret; \
     961 })
     962 #endif
    963 
     964 #ifdef __LITTLE_ENDIAN__
         /* vld3_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 11 to __builtin_neon_vld3_dup_bf16 and yields the
          * bfloat16x4x3_t it filled in. */
     965 #define vld3_dup_bf16(__p0) __extension__ ({ \
     966   bfloat16x4x3_t __ret; \
     967   __builtin_neon_vld3_dup_bf16(&__ret, __p0, 11); \
     968   __ret; \
     969 })
     970 #else
         /* vld3_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then each of val[0..2] has its 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
     971 #define vld3_dup_bf16(__p0) __extension__ ({ \
     972   bfloat16x4x3_t __ret; \
     973   __builtin_neon_vld3_dup_bf16(&__ret, __p0, 11); \
     974  \
     975   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
     976   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
     977   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
     978   __ret; \
     979 })
     980 #endif
    981 
     982 #ifdef __LITTLE_ENDIAN__
         /* vld3q_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its three vectors (cast to int8x16_t)
          * together with __p0, __p2 and the constant 43 to
          * __builtin_neon_vld3q_lane_bf16; yields the bfloat16x8x3_t written
          * through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
     983 #define vld3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     984   bfloat16x8x3_t __ret; \
     985   bfloat16x8x3_t __s1 = __p1; \
     986   __builtin_neon_vld3q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 43); \
     987   __ret; \
     988 })
     989 #else
         /* vld3q_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
     990 #define vld3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
     991   bfloat16x8x3_t __ret; \
     992   bfloat16x8x3_t __s1 = __p1; \
     993   bfloat16x8x3_t __rev1; \
     994   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
     995   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
     996   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
     997   __builtin_neon_vld3q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 43); \
     998  \
     999   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1000   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1001   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1002   __ret; \
    1003 })
    1004 #endif
   1005 
    1006 #ifdef __LITTLE_ENDIAN__
         /* vld3_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its three vectors (cast to int8x8_t)
          * together with __p0, __p2 and the constant 11 to
          * __builtin_neon_vld3_lane_bf16; yields the bfloat16x4x3_t written
          * through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1007 #define vld3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1008   bfloat16x4x3_t __ret; \
    1009   bfloat16x4x3_t __s1 = __p1; \
    1010   __builtin_neon_vld3_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 11); \
    1011   __ret; \
    1012 })
    1013 #else
         /* vld3_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
    1014 #define vld3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1015   bfloat16x4x3_t __ret; \
    1016   bfloat16x4x3_t __s1 = __p1; \
    1017   bfloat16x4x3_t __rev1; \
    1018   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1019   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1020   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    1021   __builtin_neon_vld3_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 11); \
    1022  \
    1023   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    1024   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    1025   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
    1026   __ret; \
    1027 })
    1028 #endif
   1029 
    1030 #ifdef __LITTLE_ENDIAN__
         /* vld4q_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 43 to __builtin_neon_vld4q_bf16 and yields the
          * bfloat16x8x4_t it filled in. */
    1031 #define vld4q_bf16(__p0) __extension__ ({ \
    1032   bfloat16x8x4_t __ret; \
    1033   __builtin_neon_vld4q_bf16(&__ret, __p0, 43); \
    1034   __ret; \
    1035 })
    1036 #else
         /* vld4q_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..3] has its 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
    1037 #define vld4q_bf16(__p0) __extension__ ({ \
    1038   bfloat16x8x4_t __ret; \
    1039   __builtin_neon_vld4q_bf16(&__ret, __p0, 43); \
    1040  \
    1041   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1042   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1043   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1044   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
    1045   __ret; \
    1046 })
    1047 #endif
   1048 
    1049 #ifdef __LITTLE_ENDIAN__
         /* vld4_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0 and
          * the constant 11 to __builtin_neon_vld4_bf16 and yields the
          * bfloat16x4x4_t it filled in. */
    1050 #define vld4_bf16(__p0) __extension__ ({ \
    1051   bfloat16x4x4_t __ret; \
    1052   __builtin_neon_vld4_bf16(&__ret, __p0, 11); \
    1053   __ret; \
    1054 })
    1055 #else
         /* vld4_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin call,
          * then each of val[0..3] has its 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
    1056 #define vld4_bf16(__p0) __extension__ ({ \
    1057   bfloat16x4x4_t __ret; \
    1058   __builtin_neon_vld4_bf16(&__ret, __p0, 11); \
    1059  \
    1060   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    1061   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    1062   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
    1063   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
    1064   __ret; \
    1065 })
    1066 #endif
   1067 
    1068 #ifdef __LITTLE_ENDIAN__
         /* vld4q_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 43 to __builtin_neon_vld4q_dup_bf16 and yields the
          * bfloat16x8x4_t it filled in. */
    1069 #define vld4q_dup_bf16(__p0) __extension__ ({ \
    1070   bfloat16x8x4_t __ret; \
    1071   __builtin_neon_vld4q_dup_bf16(&__ret, __p0, 43); \
    1072   __ret; \
    1073 })
    1074 #else
         /* vld4q_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then each of val[0..3] has its 8 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
    1075 #define vld4q_dup_bf16(__p0) __extension__ ({ \
    1076   bfloat16x8x4_t __ret; \
    1077   __builtin_neon_vld4q_dup_bf16(&__ret, __p0, 43); \
    1078  \
    1079   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1080   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1081   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1082   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
    1083   __ret; \
    1084 })
    1085 #endif
   1086 
    1087 #ifdef __LITTLE_ENDIAN__
         /* vld4_dup_bf16(__p0), __LITTLE_ENDIAN__ defined: passes &__ret, __p0
          * and the constant 11 to __builtin_neon_vld4_dup_bf16 and yields the
          * bfloat16x4x4_t it filled in. */
    1088 #define vld4_dup_bf16(__p0) __extension__ ({ \
    1089   bfloat16x4x4_t __ret; \
    1090   __builtin_neon_vld4_dup_bf16(&__ret, __p0, 11); \
    1091   __ret; \
    1092 })
    1093 #else
         /* vld4_dup_bf16(__p0), __LITTLE_ENDIAN__ not defined: same builtin
          * call, then each of val[0..3] has its 4 lanes reversed with
          * __builtin_shufflevector before __ret is yielded. */
    1094 #define vld4_dup_bf16(__p0) __extension__ ({ \
    1095   bfloat16x4x4_t __ret; \
    1096   __builtin_neon_vld4_dup_bf16(&__ret, __p0, 11); \
    1097  \
    1098   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    1099   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    1100   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
    1101   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
    1102   __ret; \
    1103 })
    1104 #endif
   1105 
    1106 #ifdef __LITTLE_ENDIAN__
         /* vld4q_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its four vectors (cast to int8x16_t)
          * together with __p0, __p2 and the constant 43 to
          * __builtin_neon_vld4q_lane_bf16; yields the bfloat16x8x4_t written
          * through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1107 #define vld4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1108   bfloat16x8x4_t __ret; \
    1109   bfloat16x8x4_t __s1 = __p1; \
    1110   __builtin_neon_vld4q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 43); \
    1111   __ret; \
    1112 })
    1113 #else
         /* vld4q_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
    1114 #define vld4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1115   bfloat16x8x4_t __ret; \
    1116   bfloat16x8x4_t __s1 = __p1; \
    1117   bfloat16x8x4_t __rev1; \
    1118   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1119   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1120   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1121   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
    1122   __builtin_neon_vld4q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 43); \
    1123  \
    1124   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1125   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1126   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1127   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
    1128   __ret; \
    1129 })
    1130 #endif
   1131 
    1132 #ifdef __LITTLE_ENDIAN__
         /* vld4_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into __s1 and passes its four vectors (cast to int8x8_t)
          * together with __p0, __p2 and the constant 11 to
          * __builtin_neon_vld4_lane_bf16; yields the bfloat16x4x4_t written
          * through &__ret.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1133 #define vld4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1134   bfloat16x4x4_t __ret; \
    1135   bfloat16x4x4_t __s1 = __p1; \
    1136   __builtin_neon_vld4_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 11); \
    1137   __ret; \
    1138 })
    1139 #else
         /* vld4_lane_bf16, __LITTLE_ENDIAN__ not defined: each input vector is
          * lane-reversed into __rev1, the builtin is called on the reversed
          * copies, and each output vector is lane-reversed again before __ret is
          * yielded. */
    1140 #define vld4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1141   bfloat16x4x4_t __ret; \
    1142   bfloat16x4x4_t __s1 = __p1; \
    1143   bfloat16x4x4_t __rev1; \
    1144   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1145   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1146   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    1147   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
    1148   __builtin_neon_vld4_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 11); \
    1149  \
    1150   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
    1151   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
    1152   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
    1153   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
    1154   __ret; \
    1155 })
    1156 #endif
   1157 
    1158 #ifdef __LITTLE_ENDIAN__
         /* vsetq_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p0 into a bfloat16_t and __p1 into a bfloat16x8_t, then yields the
          * bfloat16x8_t returned by __builtin_neon_vsetq_lane_bf16(__s0, __s1, __p2).
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1159 #define vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1160   bfloat16x8_t __ret; \
    1161   bfloat16_t __s0 = __p0; \
    1162   bfloat16x8_t __s1 = __p1; \
    1163   __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__s1, __p2); \
    1164   __ret; \
    1165 })
    1166 #else
         /* vsetq_lane_bf16, __LITTLE_ENDIAN__ not defined: the input vector is
          * lane-reversed into __rev1 before the builtin call and the builtin's
          * result is lane-reversed again before being yielded. */
    1167 #define vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1168   bfloat16x8_t __ret; \
    1169   bfloat16_t __s0 = __p0; \
    1170   bfloat16x8_t __s1 = __p1; \
    1171   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    1172   __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__rev1, __p2); \
    1173   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    1174   __ret; \
    1175 })
         /* __noswap_vsetq_lane_bf16: defined only in this #else branch; calls the
          * same builtin with no lane reversal on either the input or the result. */
    1176 #define __noswap_vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1177   bfloat16x8_t __ret; \
    1178   bfloat16_t __s0 = __p0; \
    1179   bfloat16x8_t __s1 = __p1; \
    1180   __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__s1, __p2); \
    1181   __ret; \
    1182 })
    1183 #endif
   1184 
    1185 #ifdef __LITTLE_ENDIAN__
         /* vset_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p0 into a bfloat16_t and __p1 into a bfloat16x4_t, then yields the
          * bfloat16x4_t returned by __builtin_neon_vset_lane_bf16(__s0, __s1, __p2).
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1186 #define vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1187   bfloat16x4_t __ret; \
    1188   bfloat16_t __s0 = __p0; \
    1189   bfloat16x4_t __s1 = __p1; \
    1190   __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__s1, __p2); \
    1191   __ret; \
    1192 })
    1193 #else
         /* vset_lane_bf16, __LITTLE_ENDIAN__ not defined: the input vector is
          * lane-reversed into __rev1 before the builtin call and the builtin's
          * result is lane-reversed again before being yielded. */
    1194 #define vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1195   bfloat16x4_t __ret; \
    1196   bfloat16_t __s0 = __p0; \
    1197   bfloat16x4_t __s1 = __p1; \
    1198   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    1199   __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__rev1, __p2); \
    1200   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    1201   __ret; \
    1202 })
         /* __noswap_vset_lane_bf16: defined only in this #else branch; calls the
          * same builtin with no lane reversal on either the input or the result. */
    1203 #define __noswap_vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1204   bfloat16x4_t __ret; \
    1205   bfloat16_t __s0 = __p0; \
    1206   bfloat16x4_t __s1 = __p1; \
    1207   __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__s1, __p2); \
    1208   __ret; \
    1209 })
    1210 #endif
   1211 
    1212 #ifdef __LITTLE_ENDIAN__
         /* vst1q_bf16(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into a
          * bfloat16x8_t and passes it, cast to int8x16_t, with __p0 and the
          * constant 43 to __builtin_neon_vst1q_bf16. */
    1213 #define vst1q_bf16(__p0, __p1) __extension__ ({ \
    1214   bfloat16x8_t __s1 = __p1; \
    1215   __builtin_neon_vst1q_bf16(__p0, (int8x16_t)__s1, 43); \
    1216 })
    1217 #else
         /* vst1q_bf16, __LITTLE_ENDIAN__ not defined: the vector's 8 lanes are
          * reversed into __rev1 first, and the reversed copy is what the builtin
          * receives. */
    1218 #define vst1q_bf16(__p0, __p1) __extension__ ({ \
    1219   bfloat16x8_t __s1 = __p1; \
    1220   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    1221   __builtin_neon_vst1q_bf16(__p0, (int8x16_t)__rev1, 43); \
    1222 })
    1223 #endif
   1224 
    1225 #ifdef __LITTLE_ENDIAN__
         /* vst1_bf16(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into a
          * bfloat16x4_t and passes it, cast to int8x8_t, with __p0 and the
          * constant 11 to __builtin_neon_vst1_bf16. */
    1226 #define vst1_bf16(__p0, __p1) __extension__ ({ \
    1227   bfloat16x4_t __s1 = __p1; \
    1228   __builtin_neon_vst1_bf16(__p0, (int8x8_t)__s1, 11); \
    1229 })
    1230 #else
         /* vst1_bf16, __LITTLE_ENDIAN__ not defined: the vector's 4 lanes are
          * reversed into __rev1 first, and the reversed copy is what the builtin
          * receives. */
    1231 #define vst1_bf16(__p0, __p1) __extension__ ({ \
    1232   bfloat16x4_t __s1 = __p1; \
    1233   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    1234   __builtin_neon_vst1_bf16(__p0, (int8x8_t)__rev1, 11); \
    1235 })
    1236 #endif
   1237 
    1238 #ifdef __LITTLE_ENDIAN__
         /* vst1q_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into a bfloat16x8_t and passes it, cast to int8x16_t, with __p0,
          * __p2 and the constant 43 to __builtin_neon_vst1q_lane_bf16.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1239 #define vst1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1240   bfloat16x8_t __s1 = __p1; \
    1241   __builtin_neon_vst1q_lane_bf16(__p0, (int8x16_t)__s1, __p2, 43); \
    1242 })
    1243 #else
         /* vst1q_lane_bf16, __LITTLE_ENDIAN__ not defined: the vector's 8 lanes
          * are reversed into __rev1 first; __p2 is forwarded unchanged. */
    1244 #define vst1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1245   bfloat16x8_t __s1 = __p1; \
    1246   bfloat16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    1247   __builtin_neon_vst1q_lane_bf16(__p0, (int8x16_t)__rev1, __p2, 43); \
    1248 })
    1249 #endif
   1250 
    1251 #ifdef __LITTLE_ENDIAN__
         /* vst1_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into a bfloat16x4_t and passes it, cast to int8x8_t, with __p0,
          * __p2 and the constant 11 to __builtin_neon_vst1_lane_bf16.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1252 #define vst1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1253   bfloat16x4_t __s1 = __p1; \
    1254   __builtin_neon_vst1_lane_bf16(__p0, (int8x8_t)__s1, __p2, 11); \
    1255 })
    1256 #else
         /* vst1_lane_bf16, __LITTLE_ENDIAN__ not defined: the vector's 4 lanes
          * are reversed into __rev1 first; __p2 is forwarded unchanged. */
    1257 #define vst1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1258   bfloat16x4_t __s1 = __p1; \
    1259   bfloat16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    1260   __builtin_neon_vst1_lane_bf16(__p0, (int8x8_t)__rev1, __p2, 11); \
    1261 })
    1262 #endif
   1263 
    1264 #ifdef __LITTLE_ENDIAN__
         /* vst1q_bf16_x2(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x8x2_t and passes its two vectors, cast to int8x16_t, with
          * __p0 and the constant 43 to __builtin_neon_vst1q_bf16_x2. */
    1265 #define vst1q_bf16_x2(__p0, __p1) __extension__ ({ \
    1266   bfloat16x8x2_t __s1 = __p1; \
    1267   __builtin_neon_vst1q_bf16_x2(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 43); \
    1268 })
    1269 #else
         /* vst1q_bf16_x2, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1270 #define vst1q_bf16_x2(__p0, __p1) __extension__ ({ \
    1271   bfloat16x8x2_t __s1 = __p1; \
    1272   bfloat16x8x2_t __rev1; \
    1273   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1274   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1275   __builtin_neon_vst1q_bf16_x2(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 43); \
    1276 })
    1277 #endif
   1278 
    1279 #ifdef __LITTLE_ENDIAN__
         /* vst1_bf16_x2(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x4x2_t and passes its two vectors, cast to int8x8_t, with
          * __p0 and the constant 11 to __builtin_neon_vst1_bf16_x2. */
    1280 #define vst1_bf16_x2(__p0, __p1) __extension__ ({ \
    1281   bfloat16x4x2_t __s1 = __p1; \
    1282   __builtin_neon_vst1_bf16_x2(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 11); \
    1283 })
    1284 #else
         /* vst1_bf16_x2, __LITTLE_ENDIAN__ not defined: each vector's 4 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1285 #define vst1_bf16_x2(__p0, __p1) __extension__ ({ \
    1286   bfloat16x4x2_t __s1 = __p1; \
    1287   bfloat16x4x2_t __rev1; \
    1288   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1289   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1290   __builtin_neon_vst1_bf16_x2(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 11); \
    1291 })
    1292 #endif
   1293 
    1294 #ifdef __LITTLE_ENDIAN__
         /* vst1q_bf16_x3(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x8x3_t and passes its three vectors, cast to int8x16_t, with
          * __p0 and the constant 43 to __builtin_neon_vst1q_bf16_x3. */
    1295 #define vst1q_bf16_x3(__p0, __p1) __extension__ ({ \
    1296   bfloat16x8x3_t __s1 = __p1; \
    1297   __builtin_neon_vst1q_bf16_x3(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 43); \
    1298 })
    1299 #else
         /* vst1q_bf16_x3, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1300 #define vst1q_bf16_x3(__p0, __p1) __extension__ ({ \
    1301   bfloat16x8x3_t __s1 = __p1; \
    1302   bfloat16x8x3_t __rev1; \
    1303   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1304   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1305   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1306   __builtin_neon_vst1q_bf16_x3(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 43); \
    1307 })
    1308 #endif
   1309 
    1310 #ifdef __LITTLE_ENDIAN__
         /* vst1_bf16_x3(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x4x3_t and passes its three vectors, cast to int8x8_t, with
          * __p0 and the constant 11 to __builtin_neon_vst1_bf16_x3. */
    1311 #define vst1_bf16_x3(__p0, __p1) __extension__ ({ \
    1312   bfloat16x4x3_t __s1 = __p1; \
    1313   __builtin_neon_vst1_bf16_x3(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 11); \
    1314 })
    1315 #else
         /* vst1_bf16_x3, __LITTLE_ENDIAN__ not defined: each vector's 4 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1316 #define vst1_bf16_x3(__p0, __p1) __extension__ ({ \
    1317   bfloat16x4x3_t __s1 = __p1; \
    1318   bfloat16x4x3_t __rev1; \
    1319   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1320   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1321   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    1322   __builtin_neon_vst1_bf16_x3(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 11); \
    1323 })
    1324 #endif
   1325 
    1326 #ifdef __LITTLE_ENDIAN__
         /* vst1q_bf16_x4(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x8x4_t and passes its four vectors, cast to int8x16_t, with
          * __p0 and the constant 43 to __builtin_neon_vst1q_bf16_x4. */
    1327 #define vst1q_bf16_x4(__p0, __p1) __extension__ ({ \
    1328   bfloat16x8x4_t __s1 = __p1; \
    1329   __builtin_neon_vst1q_bf16_x4(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 43); \
    1330 })
    1331 #else
         /* vst1q_bf16_x4, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1332 #define vst1q_bf16_x4(__p0, __p1) __extension__ ({ \
    1333   bfloat16x8x4_t __s1 = __p1; \
    1334   bfloat16x8x4_t __rev1; \
    1335   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1336   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1337   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1338   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
    1339   __builtin_neon_vst1q_bf16_x4(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 43); \
    1340 })
    1341 #endif
   1342 
    1343 #ifdef __LITTLE_ENDIAN__
         /* vst1_bf16_x4(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into
          * a bfloat16x4x4_t and passes its four vectors, cast to int8x8_t, with
          * __p0 and the constant 11 to __builtin_neon_vst1_bf16_x4. */
    1344 #define vst1_bf16_x4(__p0, __p1) __extension__ ({ \
    1345   bfloat16x4x4_t __s1 = __p1; \
    1346   __builtin_neon_vst1_bf16_x4(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 11); \
    1347 })
    1348 #else
         /* vst1_bf16_x4, __LITTLE_ENDIAN__ not defined: each vector's 4 lanes
          * are reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1349 #define vst1_bf16_x4(__p0, __p1) __extension__ ({ \
    1350   bfloat16x4x4_t __s1 = __p1; \
    1351   bfloat16x4x4_t __rev1; \
    1352   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1353   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1354   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    1355   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
    1356   __builtin_neon_vst1_bf16_x4(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 11); \
    1357 })
    1358 #endif
   1359 
    1360 #ifdef __LITTLE_ENDIAN__
         /* vst2q_bf16(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into a
          * bfloat16x8x2_t and passes its two vectors, cast to int8x16_t, with
          * __p0 and the constant 43 to __builtin_neon_vst2q_bf16. */
    1361 #define vst2q_bf16(__p0, __p1) __extension__ ({ \
    1362   bfloat16x8x2_t __s1 = __p1; \
    1363   __builtin_neon_vst2q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 43); \
    1364 })
    1365 #else
         /* vst2q_bf16, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes are
          * reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1366 #define vst2q_bf16(__p0, __p1) __extension__ ({ \
    1367   bfloat16x8x2_t __s1 = __p1; \
    1368   bfloat16x8x2_t __rev1; \
    1369   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1370   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1371   __builtin_neon_vst2q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 43); \
    1372 })
    1373 #endif
   1374 
    1375 #ifdef __LITTLE_ENDIAN__
         /* vst2_bf16(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into a
          * bfloat16x4x2_t and passes its two vectors, cast to int8x8_t, with
          * __p0 and the constant 11 to __builtin_neon_vst2_bf16. */
    1376 #define vst2_bf16(__p0, __p1) __extension__ ({ \
    1377   bfloat16x4x2_t __s1 = __p1; \
    1378   __builtin_neon_vst2_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 11); \
    1379 })
    1380 #else
         /* vst2_bf16, __LITTLE_ENDIAN__ not defined: each vector's 4 lanes are
          * reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1381 #define vst2_bf16(__p0, __p1) __extension__ ({ \
    1382   bfloat16x4x2_t __s1 = __p1; \
    1383   bfloat16x4x2_t __rev1; \
    1384   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1385   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1386   __builtin_neon_vst2_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 11); \
    1387 })
    1388 #endif
   1389 
    1390 #ifdef __LITTLE_ENDIAN__
         /* vst2q_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into a bfloat16x8x2_t and passes its two vectors, cast to
          * int8x16_t, with __p0, __p2 and the constant 43 to
          * __builtin_neon_vst2q_lane_bf16.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1391 #define vst2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1392   bfloat16x8x2_t __s1 = __p1; \
    1393   __builtin_neon_vst2q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 43); \
    1394 })
    1395 #else
         /* vst2q_lane_bf16, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes
          * are reversed into __rev1 first; __p2 is forwarded unchanged. */
    1396 #define vst2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1397   bfloat16x8x2_t __s1 = __p1; \
    1398   bfloat16x8x2_t __rev1; \
    1399   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1400   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1401   __builtin_neon_vst2q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 43); \
    1402 })
    1403 #endif
   1404 
    1405 #ifdef __LITTLE_ENDIAN__
         /* vst2_lane_bf16(__p0, __p1, __p2), __LITTLE_ENDIAN__ defined: copies
          * __p1 into a bfloat16x4x2_t and passes its two vectors, cast to
          * int8x8_t, with __p0, __p2 and the constant 11 to
          * __builtin_neon_vst2_lane_bf16.
          * NOTE(review): __p2 is presumably the lane index - confirm. */
    1406 #define vst2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1407   bfloat16x4x2_t __s1 = __p1; \
    1408   __builtin_neon_vst2_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 11); \
    1409 })
    1410 #else
         /* vst2_lane_bf16, __LITTLE_ENDIAN__ not defined: each vector's 4 lanes
          * are reversed into __rev1 first; __p2 is forwarded unchanged. */
    1411 #define vst2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
    1412   bfloat16x4x2_t __s1 = __p1; \
    1413   bfloat16x4x2_t __rev1; \
    1414   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    1415   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    1416   __builtin_neon_vst2_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 11); \
    1417 })
    1418 #endif
   1419 
    1420 #ifdef __LITTLE_ENDIAN__
         /* vst3q_bf16(__p0, __p1), __LITTLE_ENDIAN__ defined: copies __p1 into a
          * bfloat16x8x3_t and passes its three vectors, cast to int8x16_t, with
          * __p0 and the constant 43 to __builtin_neon_vst3q_bf16. */
    1421 #define vst3q_bf16(__p0, __p1) __extension__ ({ \
    1422   bfloat16x8x3_t __s1 = __p1; \
    1423   __builtin_neon_vst3q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 43); \
    1424 })
    1425 #else
         /* vst3q_bf16, __LITTLE_ENDIAN__ not defined: each vector's 8 lanes are
          * reversed into __rev1 first, and the reversed copies are what the
          * builtin receives. */
    1426 #define vst3q_bf16(__p0, __p1) __extension__ ({ \
    1427   bfloat16x8x3_t __s1 = __p1; \
    1428   bfloat16x8x3_t __rev1; \
    1429   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    1430   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    1431   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    1432   __builtin_neon_vst3q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 43); \
    1433 })
    1434 #endif
   1435 
   1436 #ifdef __LITTLE_ENDIAN__
        /* vst3_bf16(__p0, __p1): statement-expression macro. Copies __p1 into a local
         * bfloat16x4x3_t, then passes __p0, the three val[] vectors (each cast to
         * int8x8_t) and the constant 11 to __builtin_neon_vst3_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer; 11 looks like a type code -- confirm. */
   1437 #define vst3_bf16(__p0, __p1) __extension__ ({ \
   1438   bfloat16x4x3_t __s1 = __p1; \
   1439   __builtin_neon_vst3_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 11); \
   1440 })
   1441 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4 elements of each
         * of the three val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call. */
   1442 #define vst3_bf16(__p0, __p1) __extension__ ({ \
   1443   bfloat16x4x3_t __s1 = __p1; \
   1444   bfloat16x4x3_t __rev1; \
   1445   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
   1446   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
   1447   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
   1448   __builtin_neon_vst3_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 11); \
   1449 })
   1450 #endif
   1451 
   1452 #ifdef __LITTLE_ENDIAN__
        /* vst3q_lane_bf16(__p0, __p1, __p2): statement-expression macro. Copies __p1
         * into a local bfloat16x8x3_t, then passes __p0, the three val[] vectors
         * (each cast to int8x16_t), __p2 and the constant 43 to
         * __builtin_neon_vst3q_lane_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer and __p2 the lane index; 43 looks like a type code -- confirm. */
   1453 #define vst3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1454   bfloat16x8x3_t __s1 = __p1; \
   1455   __builtin_neon_vst3q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 43); \
   1456 })
   1457 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8 elements of each
         * of the three val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call; __p2 is passed through unchanged. */
   1458 #define vst3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1459   bfloat16x8x3_t __s1 = __p1; \
   1460   bfloat16x8x3_t __rev1; \
   1461   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
   1462   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
   1463   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
   1464   __builtin_neon_vst3q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 43); \
   1465 })
   1466 #endif
   1467 
   1468 #ifdef __LITTLE_ENDIAN__
        /* vst3_lane_bf16(__p0, __p1, __p2): statement-expression macro. Copies __p1
         * into a local bfloat16x4x3_t, then passes __p0, the three val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 11 to
         * __builtin_neon_vst3_lane_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer and __p2 the lane index; 11 looks like a type code -- confirm. */
   1469 #define vst3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1470   bfloat16x4x3_t __s1 = __p1; \
   1471   __builtin_neon_vst3_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 11); \
   1472 })
   1473 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4 elements of each
         * of the three val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call; __p2 is passed through unchanged. */
   1474 #define vst3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1475   bfloat16x4x3_t __s1 = __p1; \
   1476   bfloat16x4x3_t __rev1; \
   1477   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
   1478   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
   1479   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
   1480   __builtin_neon_vst3_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 11); \
   1481 })
   1482 #endif
   1483 
   1484 #ifdef __LITTLE_ENDIAN__
        /* vst4q_bf16(__p0, __p1): statement-expression macro. Copies __p1 into a
         * local bfloat16x8x4_t, then passes __p0, the four val[] vectors (each cast
         * to int8x16_t) and the constant 43 to __builtin_neon_vst4q_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer; 43 looks like a type code -- confirm. */
   1485 #define vst4q_bf16(__p0, __p1) __extension__ ({ \
   1486   bfloat16x8x4_t __s1 = __p1; \
   1487   __builtin_neon_vst4q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 43); \
   1488 })
   1489 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8 elements of each
         * of the four val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call. */
   1490 #define vst4q_bf16(__p0, __p1) __extension__ ({ \
   1491   bfloat16x8x4_t __s1 = __p1; \
   1492   bfloat16x8x4_t __rev1; \
   1493   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
   1494   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
   1495   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
   1496   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
   1497   __builtin_neon_vst4q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 43); \
   1498 })
   1499 #endif
   1500 
   1501 #ifdef __LITTLE_ENDIAN__
        /* vst4_bf16(__p0, __p1): statement-expression macro. Copies __p1 into a local
         * bfloat16x4x4_t, then passes __p0, the four val[] vectors (each cast to
         * int8x8_t) and the constant 11 to __builtin_neon_vst4_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer; 11 looks like a type code -- confirm. */
   1502 #define vst4_bf16(__p0, __p1) __extension__ ({ \
   1503   bfloat16x4x4_t __s1 = __p1; \
   1504   __builtin_neon_vst4_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 11); \
   1505 })
   1506 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4 elements of each
         * of the four val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call. */
   1507 #define vst4_bf16(__p0, __p1) __extension__ ({ \
   1508   bfloat16x4x4_t __s1 = __p1; \
   1509   bfloat16x4x4_t __rev1; \
   1510   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
   1511   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
   1512   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
   1513   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
   1514   __builtin_neon_vst4_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 11); \
   1515 })
   1516 #endif
   1517 
   1518 #ifdef __LITTLE_ENDIAN__
        /* vst4q_lane_bf16(__p0, __p1, __p2): statement-expression macro. Copies __p1
         * into a local bfloat16x8x4_t, then passes __p0, the four val[] vectors (each
         * cast to int8x16_t), __p2 and the constant 43 to
         * __builtin_neon_vst4q_lane_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer and __p2 the lane index; 43 looks like a type code -- confirm. */
   1519 #define vst4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1520   bfloat16x8x4_t __s1 = __p1; \
   1521   __builtin_neon_vst4q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 43); \
   1522 })
   1523 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8 elements of each
         * of the four val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call; __p2 is passed through unchanged. */
   1524 #define vst4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1525   bfloat16x8x4_t __s1 = __p1; \
   1526   bfloat16x8x4_t __rev1; \
   1527   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
   1528   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
   1529   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
   1530   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
   1531   __builtin_neon_vst4q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 43); \
   1532 })
   1533 #endif
   1534 
   1535 #ifdef __LITTLE_ENDIAN__
        /* vst4_lane_bf16(__p0, __p1, __p2): statement-expression macro. Copies __p1
         * into a local bfloat16x4x4_t, then passes __p0, the four val[] vectors (each
         * cast to int8x8_t), __p2 and the constant 11 to
         * __builtin_neon_vst4_lane_bf16.
         * NOTE(review): judging by the name, __p0 is presumably the destination
         * pointer and __p2 the lane index; 11 looks like a type code -- confirm. */
   1536 #define vst4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1537   bfloat16x4x4_t __s1 = __p1; \
   1538   __builtin_neon_vst4_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 11); \
   1539 })
   1540 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4 elements of each
         * of the four val[] vectors are reversed with __builtin_shufflevector into
         * __rev1 before the builtin call; __p2 is passed through unchanged. */
   1541 #define vst4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
   1542   bfloat16x4x4_t __s1 = __p1; \
   1543   bfloat16x4x4_t __rev1; \
   1544   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
   1545   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
   1546   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
   1547   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
   1548   __builtin_neon_vst4_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 11); \
   1549 })
   1550 #endif
   1551 
   1552 #ifdef __LITTLE_ENDIAN__
        /* vdotq_u32: casts __p0, __p1 and __p2 to int8x16_t, calls
         * __builtin_neon_vdotq_u32 with the trailing constant 50, and returns the
         * result cast to uint32x4_t. Declared with target("dotprod,neon").
         * NOTE(review): by its name this is presumably a dot-product accumulate into
         * __p0; the builtin's semantics and the meaning of 50 are not visible here. */
   1553 __ai __attribute__((target("dotprod,neon"))) uint32x4_t vdotq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   1554   uint32x4_t __ret;
   1555   __ret = (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
   1556   return __ret;
   1557 }
   1558 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: reverses the element
         * order of every operand (4 elements for __p0, 16 for __p1 and __p2) before
         * the builtin call, then reverses the 4-element result before returning. */
   1559 __ai __attribute__((target("dotprod,neon"))) uint32x4_t vdotq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   1560   uint32x4_t __ret;
   1561   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1562   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   1563   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   1564   __ret = (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
   1565   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1566   return __ret;
   1567 }
        /* __noswap_vdotq_u32: same builtin call as above but with no element
         * reversal on operands or result; only defined in this #else branch. */
   1568 __ai __attribute__((target("dotprod,neon"))) uint32x4_t __noswap_vdotq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   1569   uint32x4_t __ret;
   1570   __ret = (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
   1571   return __ret;
   1572 }
   1573 #endif
   1574 
   1575 #ifdef __LITTLE_ENDIAN__
        /* vdotq_s32: casts __p0, __p1 and __p2 to int8x16_t, calls
         * __builtin_neon_vdotq_s32 with the trailing constant 34, and returns the
         * result cast to int32x4_t. Declared with target("dotprod,neon").
         * NOTE(review): by its name this is presumably a signed dot-product
         * accumulate into __p0; the builtin's semantics and the meaning of 34 are
         * not visible here. */
   1576 __ai __attribute__((target("dotprod,neon"))) int32x4_t vdotq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
   1577   int32x4_t __ret;
   1578   __ret = (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   1579   return __ret;
   1580 }
   1581 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: reverses the element
         * order of every operand (4 elements for __p0, 16 for __p1 and __p2) before
         * the builtin call, then reverses the 4-element result before returning. */
   1582 __ai __attribute__((target("dotprod,neon"))) int32x4_t vdotq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
   1583   int32x4_t __ret;
   1584   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1585   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   1586   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   1587   __ret = (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
   1588   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1589   return __ret;
   1590 }
        /* __noswap_vdotq_s32: same builtin call as above but with no element
         * reversal on operands or result; only defined in this #else branch. */
   1591 __ai __attribute__((target("dotprod,neon"))) int32x4_t __noswap_vdotq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
   1592   int32x4_t __ret;
   1593   __ret = (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   1594   return __ret;
   1595 }
   1596 #endif
   1597 
   1598 #ifdef __LITTLE_ENDIAN__
        /* vdot_u32: casts __p0, __p1 and __p2 to int8x8_t, calls
         * __builtin_neon_vdot_u32 with the trailing constant 18, and returns the
         * result cast to uint32x2_t. Declared with target("dotprod,neon").
         * NOTE(review): by its name this is presumably a dot-product accumulate into
         * __p0; the builtin's semantics and the meaning of 18 are not visible here. */
   1599 __ai __attribute__((target("dotprod,neon"))) uint32x2_t vdot_u32(uint32x2_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
   1600   uint32x2_t __ret;
   1601   __ret = (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18);
   1602   return __ret;
   1603 }
   1604 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: reverses the element
         * order of every operand (2 elements for __p0, 8 for __p1 and __p2) before
         * the builtin call, then reverses the 2-element result before returning. */
   1605 __ai __attribute__((target("dotprod,neon"))) uint32x2_t vdot_u32(uint32x2_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
   1606   uint32x2_t __ret;
   1607   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   1608   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1609   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   1610   __ret = (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 18);
   1611   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   1612   return __ret;
   1613 }
        /* __noswap_vdot_u32: same builtin call as above but with no element
         * reversal on operands or result; only defined in this #else branch. */
   1614 __ai __attribute__((target("dotprod,neon"))) uint32x2_t __noswap_vdot_u32(uint32x2_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
   1615   uint32x2_t __ret;
   1616   __ret = (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18);
   1617   return __ret;
   1618 }
   1619 #endif
   1620 
   1621 #ifdef __LITTLE_ENDIAN__
        /* vdot_s32: casts __p0, __p1 and __p2 to int8x8_t, calls
         * __builtin_neon_vdot_s32 with the trailing constant 2, and returns the
         * result cast to int32x2_t. Declared with target("dotprod,neon").
         * NOTE(review): by its name this is presumably a signed dot-product
         * accumulate into __p0; the builtin's semantics and the meaning of 2 are
         * not visible here. */
   1622 __ai __attribute__((target("dotprod,neon"))) int32x2_t vdot_s32(int32x2_t __p0, int8x8_t __p1, int8x8_t __p2) {
   1623   int32x2_t __ret;
   1624   __ret = (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
   1625   return __ret;
   1626 }
   1627 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: reverses the element
         * order of every operand (2 elements for __p0, 8 for __p1 and __p2) before
         * the builtin call, then reverses the 2-element result before returning. */
   1628 __ai __attribute__((target("dotprod,neon"))) int32x2_t vdot_s32(int32x2_t __p0, int8x8_t __p1, int8x8_t __p2) {
   1629   int32x2_t __ret;
   1630   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   1631   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1632   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   1633   __ret = (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2);
   1634   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   1635   return __ret;
   1636 }
        /* __noswap_vdot_s32: same builtin call as above but with no element
         * reversal on operands or result; only defined in this #else branch. */
   1637 __ai __attribute__((target("dotprod,neon"))) int32x2_t __noswap_vdot_s32(int32x2_t __p0, int8x8_t __p1, int8x8_t __p2) {
   1638   int32x2_t __ret;
   1639   __ret = (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
   1640   return __ret;
   1641 }
   1642 #endif
   1643 
   1644 #ifdef __LITTLE_ENDIAN__
        /* vabdq_f16: casts __p0 and __p1 to int8x16_t, calls
         * __builtin_neon_vabdq_f16 with the trailing constant 40, and returns the
         * result cast to float16x8_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-difference operation;
         * the builtin's semantics are not visible here. */
   1645 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vabdq_f16(float16x8_t __p0, float16x8_t __p1) {
   1646   float16x8_t __ret;
   1647   __ret = (float16x8_t) __builtin_neon_vabdq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
   1648   return __ret;
   1649 }
   1650 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1651 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vabdq_f16(float16x8_t __p0, float16x8_t __p1) {
   1652   float16x8_t __ret;
   1653   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1654   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1655   __ret = (float16x8_t) __builtin_neon_vabdq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
   1656   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1657   return __ret;
   1658 }
   1659 #endif
   1660 
   1661 #ifdef __LITTLE_ENDIAN__
        /* vabd_f16: casts __p0 and __p1 to int8x8_t, calls __builtin_neon_vabd_f16
         * with the trailing constant 8, and returns the result cast to float16x4_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-difference operation;
         * the builtin's semantics are not visible here. */
   1662 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vabd_f16(float16x4_t __p0, float16x4_t __p1) {
   1663   float16x4_t __ret;
   1664   __ret = (float16x4_t) __builtin_neon_vabd_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   1665   return __ret;
   1666 }
   1667 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1668 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vabd_f16(float16x4_t __p0, float16x4_t __p1) {
   1669   float16x4_t __ret;
   1670   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1671   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1672   __ret = (float16x4_t) __builtin_neon_vabd_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   1673   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1674   return __ret;
   1675 }
   1676 #endif
   1677 
   1678 #ifdef __LITTLE_ENDIAN__
        /* vabsq_f16: casts __p0 to int8x16_t, calls __builtin_neon_vabsq_f16 with
         * the trailing constant 40, and returns the result cast to float16x8_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value operation; the
         * builtin's semantics are not visible here. */
   1679 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vabsq_f16(float16x8_t __p0) {
   1680   float16x8_t __ret;
   1681   __ret = (float16x8_t) __builtin_neon_vabsq_f16((int8x16_t)__p0, 40);
   1682   return __ret;
   1683 }
   1684 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   1685 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vabsq_f16(float16x8_t __p0) {
   1686   float16x8_t __ret;
   1687   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1688   __ret = (float16x8_t) __builtin_neon_vabsq_f16((int8x16_t)__rev0, 40);
   1689   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1690   return __ret;
   1691 }
   1692 #endif
   1693 
   1694 #ifdef __LITTLE_ENDIAN__
        /* vabs_f16: casts __p0 to int8x8_t, calls __builtin_neon_vabs_f16 with the
         * trailing constant 8, and returns the result cast to float16x4_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value operation; the
         * builtin's semantics are not visible here. */
   1695 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vabs_f16(float16x4_t __p0) {
   1696   float16x4_t __ret;
   1697   __ret = (float16x4_t) __builtin_neon_vabs_f16((int8x8_t)__p0, 8);
   1698   return __ret;
   1699 }
   1700 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   1701 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vabs_f16(float16x4_t __p0) {
   1702   float16x4_t __ret;
   1703   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1704   __ret = (float16x4_t) __builtin_neon_vabs_f16((int8x8_t)__rev0, 8);
   1705   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1706   return __ret;
   1707 }
   1708 #endif
   1709 
   1710 #ifdef __LITTLE_ENDIAN__
        /* vaddq_f16: returns __p0 + __p1, using the + operator directly on the two
         * float16x8_t operands (no builtin call). Declared with
         * target("fullfp16,neon"). */
   1711 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vaddq_f16(float16x8_t __p0, float16x8_t __p1) {
   1712   float16x8_t __ret;
   1713   __ret = __p0 + __p1;
   1714   return __ret;
   1715 }
   1716 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed, the reversed copies are added, and the sum is
         * reversed again before being returned. */
   1717 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vaddq_f16(float16x8_t __p0, float16x8_t __p1) {
   1718   float16x8_t __ret;
   1719   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1720   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1721   __ret = __rev0 + __rev1;
   1722   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1723   return __ret;
   1724 }
   1725 #endif
   1726 
   1727 #ifdef __LITTLE_ENDIAN__
        /* vadd_f16: returns __p0 + __p1, using the + operator directly on the two
         * float16x4_t operands (no builtin call). Declared with
         * target("fullfp16,neon"). */
   1728 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vadd_f16(float16x4_t __p0, float16x4_t __p1) {
   1729   float16x4_t __ret;
   1730   __ret = __p0 + __p1;
   1731   return __ret;
   1732 }
   1733 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed, the reversed copies are added, and the sum is
         * reversed again before being returned. */
   1734 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vadd_f16(float16x4_t __p0, float16x4_t __p1) {
   1735   float16x4_t __ret;
   1736   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1737   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1738   __ret = __rev0 + __rev1;
   1739   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1740   return __ret;
   1741 }
   1742 #endif
   1743 
   1744 #ifdef __LITTLE_ENDIAN__
        /* vcageq_f16: casts __p0 and __p1 to int8x16_t, calls
         * __builtin_neon_vcageq_f16 with the trailing constant 49, and returns the
         * result cast to uint16x8_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value ">=" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1745 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcageq_f16(float16x8_t __p0, float16x8_t __p1) {
   1746   uint16x8_t __ret;
   1747   __ret = (uint16x8_t) __builtin_neon_vcageq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
   1748   return __ret;
   1749 }
   1750 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1751 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcageq_f16(float16x8_t __p0, float16x8_t __p1) {
   1752   uint16x8_t __ret;
   1753   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1754   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1755   __ret = (uint16x8_t) __builtin_neon_vcageq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
   1756   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1757   return __ret;
   1758 }
   1759 #endif
   1760 
   1761 #ifdef __LITTLE_ENDIAN__
        /* vcage_f16: casts __p0 and __p1 to int8x8_t, calls
         * __builtin_neon_vcage_f16 with the trailing constant 17, and returns the
         * result cast to uint16x4_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value ">=" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1762 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcage_f16(float16x4_t __p0, float16x4_t __p1) {
   1763   uint16x4_t __ret;
   1764   __ret = (uint16x4_t) __builtin_neon_vcage_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
   1765   return __ret;
   1766 }
   1767 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1768 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcage_f16(float16x4_t __p0, float16x4_t __p1) {
   1769   uint16x4_t __ret;
   1770   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1771   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1772   __ret = (uint16x4_t) __builtin_neon_vcage_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
   1773   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1774   return __ret;
   1775 }
   1776 #endif
   1777 
   1778 #ifdef __LITTLE_ENDIAN__
        /* vcagtq_f16: casts __p0 and __p1 to int8x16_t, calls
         * __builtin_neon_vcagtq_f16 with the trailing constant 49, and returns the
         * result cast to uint16x8_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value ">" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1779 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcagtq_f16(float16x8_t __p0, float16x8_t __p1) {
   1780   uint16x8_t __ret;
   1781   __ret = (uint16x8_t) __builtin_neon_vcagtq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
   1782   return __ret;
   1783 }
   1784 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1785 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcagtq_f16(float16x8_t __p0, float16x8_t __p1) {
   1786   uint16x8_t __ret;
   1787   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1788   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1789   __ret = (uint16x8_t) __builtin_neon_vcagtq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
   1790   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1791   return __ret;
   1792 }
   1793 #endif
   1794 
   1795 #ifdef __LITTLE_ENDIAN__
        /* vcagt_f16: casts __p0 and __p1 to int8x8_t, calls
         * __builtin_neon_vcagt_f16 with the trailing constant 17, and returns the
         * result cast to uint16x4_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value ">" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1796 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcagt_f16(float16x4_t __p0, float16x4_t __p1) {
   1797   uint16x4_t __ret;
   1798   __ret = (uint16x4_t) __builtin_neon_vcagt_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
   1799   return __ret;
   1800 }
   1801 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1802 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcagt_f16(float16x4_t __p0, float16x4_t __p1) {
   1803   uint16x4_t __ret;
   1804   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1805   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1806   __ret = (uint16x4_t) __builtin_neon_vcagt_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
   1807   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1808   return __ret;
   1809 }
   1810 #endif
   1811 
   1812 #ifdef __LITTLE_ENDIAN__
        /* vcaleq_f16: casts __p0 and __p1 to int8x16_t, calls
         * __builtin_neon_vcaleq_f16 with the trailing constant 49, and returns the
         * result cast to uint16x8_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value "<=" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1813 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaleq_f16(float16x8_t __p0, float16x8_t __p1) {
   1814   uint16x8_t __ret;
   1815   __ret = (uint16x8_t) __builtin_neon_vcaleq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
   1816   return __ret;
   1817 }
   1818 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1819 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaleq_f16(float16x8_t __p0, float16x8_t __p1) {
   1820   uint16x8_t __ret;
   1821   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1822   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1823   __ret = (uint16x8_t) __builtin_neon_vcaleq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
   1824   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1825   return __ret;
   1826 }
   1827 #endif
   1828 
   1829 #ifdef __LITTLE_ENDIAN__
        /* vcale_f16: casts __p0 and __p1 to int8x8_t, calls
         * __builtin_neon_vcale_f16 with the trailing constant 17, and returns the
         * result cast to uint16x4_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value "<=" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1830 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcale_f16(float16x4_t __p0, float16x4_t __p1) {
   1831   uint16x4_t __ret;
   1832   __ret = (uint16x4_t) __builtin_neon_vcale_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
   1833   return __ret;
   1834 }
   1835 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1836 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcale_f16(float16x4_t __p0, float16x4_t __p1) {
   1837   uint16x4_t __ret;
   1838   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1839   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1840   __ret = (uint16x4_t) __builtin_neon_vcale_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
   1841   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1842   return __ret;
   1843 }
   1844 #endif
   1845 
   1846 #ifdef __LITTLE_ENDIAN__
        /* vcaltq_f16: casts __p0 and __p1 to int8x16_t, calls
         * __builtin_neon_vcaltq_f16 with the trailing constant 49, and returns the
         * result cast to uint16x8_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value "<" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1847 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaltq_f16(float16x8_t __p0, float16x8_t __p1) {
   1848   uint16x8_t __ret;
   1849   __ret = (uint16x8_t) __builtin_neon_vcaltq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
   1850   return __ret;
   1851 }
   1852 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1853 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaltq_f16(float16x8_t __p0, float16x8_t __p1) {
   1854   uint16x8_t __ret;
   1855   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1856   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1857   __ret = (uint16x8_t) __builtin_neon_vcaltq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
   1858   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1859   return __ret;
   1860 }
   1861 #endif
   1862 
   1863 #ifdef __LITTLE_ENDIAN__
        /* vcalt_f16: casts __p0 and __p1 to int8x8_t, calls
         * __builtin_neon_vcalt_f16 with the trailing constant 17, and returns the
         * result cast to uint16x4_t. Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an absolute-value "<" compare
         * producing a mask; the builtin's semantics are not visible here. */
   1864 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcalt_f16(float16x4_t __p0, float16x4_t __p1) {
   1865   uint16x4_t __ret;
   1866   __ret = (uint16x4_t) __builtin_neon_vcalt_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
   1867   return __ret;
   1868 }
   1869 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed before the builtin call and the result is reversed
         * again before being returned. */
   1870 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcalt_f16(float16x4_t __p0, float16x4_t __p1) {
   1871   uint16x4_t __ret;
   1872   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1873   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1874   __ret = (uint16x4_t) __builtin_neon_vcalt_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
   1875   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1876   return __ret;
   1877 }
   1878 #endif
   1879 
   1880 #ifdef __LITTLE_ENDIAN__
        /* vceqq_f16: returns (__p0 == __p1) cast to uint16x8_t, using the ==
         * operator directly on the two float16x8_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   1881 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqq_f16(float16x8_t __p0, float16x8_t __p1) {
   1882   uint16x8_t __ret;
   1883   __ret = (uint16x8_t)(__p0 == __p1);
   1884   return __ret;
   1885 }
   1886 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   1887 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqq_f16(float16x8_t __p0, float16x8_t __p1) {
   1888   uint16x8_t __ret;
   1889   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1890   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1891   __ret = (uint16x8_t)(__rev0 == __rev1);
   1892   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1893   return __ret;
   1894 }
   1895 #endif
   1896 
   1897 #ifdef __LITTLE_ENDIAN__
        /* vceq_f16: returns (__p0 == __p1) cast to uint16x4_t, using the ==
         * operator directly on the two float16x4_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   1898 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceq_f16(float16x4_t __p0, float16x4_t __p1) {
   1899   uint16x4_t __ret;
   1900   __ret = (uint16x4_t)(__p0 == __p1);
   1901   return __ret;
   1902 }
   1903 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   1904 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceq_f16(float16x4_t __p0, float16x4_t __p1) {
   1905   uint16x4_t __ret;
   1906   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1907   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1908   __ret = (uint16x4_t)(__rev0 == __rev1);
   1909   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1910   return __ret;
   1911 }
   1912 #endif
   1913 
   1914 #ifdef __LITTLE_ENDIAN__
        /* vceqzq_f16: casts __p0 to int8x16_t, calls __builtin_neon_vceqzq_f16 with
         * the trailing constant 49, and returns the result cast to uint16x8_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an "== 0" compare producing a mask;
         * the builtin's semantics are not visible here. */
   1915 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqzq_f16(float16x8_t __p0) {
   1916   uint16x8_t __ret;
   1917   __ret = (uint16x8_t) __builtin_neon_vceqzq_f16((int8x16_t)__p0, 49);
   1918   return __ret;
   1919 }
   1920 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   1921 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqzq_f16(float16x8_t __p0) {
   1922   uint16x8_t __ret;
   1923   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1924   __ret = (uint16x8_t) __builtin_neon_vceqzq_f16((int8x16_t)__rev0, 49);
   1925   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1926   return __ret;
   1927 }
   1928 #endif
   1929 
   1930 #ifdef __LITTLE_ENDIAN__
        /* vceqz_f16: casts __p0 to int8x8_t, calls __builtin_neon_vceqz_f16 with
         * the trailing constant 17, and returns the result cast to uint16x4_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably an "== 0" compare producing a mask;
         * the builtin's semantics are not visible here. */
   1931 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceqz_f16(float16x4_t __p0) {
   1932   uint16x4_t __ret;
   1933   __ret = (uint16x4_t) __builtin_neon_vceqz_f16((int8x8_t)__p0, 17);
   1934   return __ret;
   1935 }
   1936 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   1937 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceqz_f16(float16x4_t __p0) {
   1938   uint16x4_t __ret;
   1939   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1940   __ret = (uint16x4_t) __builtin_neon_vceqz_f16((int8x8_t)__rev0, 17);
   1941   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1942   return __ret;
   1943 }
   1944 #endif
   1945 
   1946 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_f16: returns (__p0 >= __p1) cast to uint16x8_t, using the >=
         * operator directly on the two float16x8_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   1947 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgeq_f16(float16x8_t __p0, float16x8_t __p1) {
   1948   uint16x8_t __ret;
   1949   __ret = (uint16x8_t)(__p0 >= __p1);
   1950   return __ret;
   1951 }
   1952 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   1953 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgeq_f16(float16x8_t __p0, float16x8_t __p1) {
   1954   uint16x8_t __ret;
   1955   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1956   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   1957   __ret = (uint16x8_t)(__rev0 >= __rev1);
   1958   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1959   return __ret;
   1960 }
   1961 #endif
   1962 
   1963 #ifdef __LITTLE_ENDIAN__
        /* vcge_f16: returns (__p0 >= __p1) cast to uint16x4_t, using the >=
         * operator directly on the two float16x4_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   1964 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcge_f16(float16x4_t __p0, float16x4_t __p1) {
   1965   uint16x4_t __ret;
   1966   __ret = (uint16x4_t)(__p0 >= __p1);
   1967   return __ret;
   1968 }
   1969 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   1970 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcge_f16(float16x4_t __p0, float16x4_t __p1) {
   1971   uint16x4_t __ret;
   1972   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   1973   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   1974   __ret = (uint16x4_t)(__rev0 >= __rev1);
   1975   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   1976   return __ret;
   1977 }
   1978 #endif
   1979 
   1980 #ifdef __LITTLE_ENDIAN__
        /* vcgezq_f16: casts __p0 to int8x16_t, calls __builtin_neon_vcgezq_f16 with
         * the trailing constant 49, and returns the result cast to uint16x8_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably a ">= 0" compare producing a mask;
         * the builtin's semantics are not visible here. */
   1981 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgezq_f16(float16x8_t __p0) {
   1982   uint16x8_t __ret;
   1983   __ret = (uint16x8_t) __builtin_neon_vcgezq_f16((int8x16_t)__p0, 49);
   1984   return __ret;
   1985 }
   1986 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   1987 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgezq_f16(float16x8_t __p0) {
   1988   uint16x8_t __ret;
   1989   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   1990   __ret = (uint16x8_t) __builtin_neon_vcgezq_f16((int8x16_t)__rev0, 49);
   1991   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   1992   return __ret;
   1993 }
   1994 #endif
   1995 
   1996 #ifdef __LITTLE_ENDIAN__
        /* vcgez_f16: casts __p0 to int8x8_t, calls __builtin_neon_vcgez_f16 with
         * the trailing constant 17, and returns the result cast to uint16x4_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably a ">= 0" compare producing a mask;
         * the builtin's semantics are not visible here. */
   1997 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgez_f16(float16x4_t __p0) {
   1998   uint16x4_t __ret;
   1999   __ret = (uint16x4_t) __builtin_neon_vcgez_f16((int8x8_t)__p0, 17);
   2000   return __ret;
   2001 }
   2002 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 4-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   2003 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgez_f16(float16x4_t __p0) {
   2004   uint16x4_t __ret;
   2005   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2006   __ret = (uint16x4_t) __builtin_neon_vcgez_f16((int8x8_t)__rev0, 17);
   2007   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2008   return __ret;
   2009 }
   2010 #endif
   2011 
   2012 #ifdef __LITTLE_ENDIAN__
        /* vcgtq_f16: returns (__p0 > __p1) cast to uint16x8_t, using the >
         * operator directly on the two float16x8_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   2013 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtq_f16(float16x8_t __p0, float16x8_t __p1) {
   2014   uint16x8_t __ret;
   2015   __ret = (uint16x8_t)(__p0 > __p1);
   2016   return __ret;
   2017 }
   2018 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 8-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   2019 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtq_f16(float16x8_t __p0, float16x8_t __p1) {
   2020   uint16x8_t __ret;
   2021   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2022   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2023   __ret = (uint16x8_t)(__rev0 > __rev1);
   2024   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2025   return __ret;
   2026 }
   2027 #endif
   2028 
   2029 #ifdef __LITTLE_ENDIAN__
        /* vcgt_f16: returns (__p0 > __p1) cast to uint16x4_t, using the >
         * operator directly on the two float16x4_t operands (no builtin call).
         * Declared with target("fullfp16,neon"). */
   2030 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgt_f16(float16x4_t __p0, float16x4_t __p1) {
   2031   uint16x4_t __ret;
   2032   __ret = (uint16x4_t)(__p0 > __p1);
   2033   return __ret;
   2034 }
   2035 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: both 4-element
         * operands are reversed, the reversed copies are compared, and the result
         * is reversed again before being returned. */
   2036 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgt_f16(float16x4_t __p0, float16x4_t __p1) {
   2037   uint16x4_t __ret;
   2038   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2039   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2040   __ret = (uint16x4_t)(__rev0 > __rev1);
   2041   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2042   return __ret;
   2043 }
   2044 #endif
   2045 
   2046 #ifdef __LITTLE_ENDIAN__
        /* vcgtzq_f16: casts __p0 to int8x16_t, calls __builtin_neon_vcgtzq_f16 with
         * the trailing constant 49, and returns the result cast to uint16x8_t.
         * Declared with target("fullfp16,neon").
         * NOTE(review): by its name presumably a "> 0" compare producing a mask;
         * the builtin's semantics are not visible here. */
   2047 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtzq_f16(float16x8_t __p0) {
   2048   uint16x8_t __ret;
   2049   __ret = (uint16x8_t) __builtin_neon_vcgtzq_f16((int8x16_t)__p0, 49);
   2050   return __ret;
   2051 }
   2052 #else
        /* Variant used when __LITTLE_ENDIAN__ is not defined: the 8-element operand
         * is reversed before the builtin call and the result is reversed again
         * before being returned. */
   2053 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtzq_f16(float16x8_t __p0) {
   2054   uint16x8_t __ret;
   2055   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2056   __ret = (uint16x8_t) __builtin_neon_vcgtzq_f16((int8x16_t)__rev0, 49);
   2057   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2058   return __ret;
   2059 }
   2060 #endif
   2061 
   2062 #ifdef __LITTLE_ENDIAN__
   2063 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgtz_f16(float16x4_t __p0) {
   2064   uint16x4_t __ret;
   2065   __ret = (uint16x4_t) __builtin_neon_vcgtz_f16((int8x8_t)__p0, 17);
   2066   return __ret;
   2067 }
   2068 #else
   2069 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgtz_f16(float16x4_t __p0) {
   2070   uint16x4_t __ret;
   2071   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2072   __ret = (uint16x4_t) __builtin_neon_vcgtz_f16((int8x8_t)__rev0, 17);
   2073   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2074   return __ret;
   2075 }
   2076 #endif
   2077 
   2078 #ifdef __LITTLE_ENDIAN__
   2079 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcleq_f16(float16x8_t __p0, float16x8_t __p1) {
   2080   uint16x8_t __ret;
   2081   __ret = (uint16x8_t)(__p0 <= __p1);
   2082   return __ret;
   2083 }
   2084 #else
   2085 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcleq_f16(float16x8_t __p0, float16x8_t __p1) {
   2086   uint16x8_t __ret;
   2087   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2088   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2089   __ret = (uint16x8_t)(__rev0 <= __rev1);
   2090   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2091   return __ret;
   2092 }
   2093 #endif
   2094 
   2095 #ifdef __LITTLE_ENDIAN__
   2096 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcle_f16(float16x4_t __p0, float16x4_t __p1) {
   2097   uint16x4_t __ret;
   2098   __ret = (uint16x4_t)(__p0 <= __p1);
   2099   return __ret;
   2100 }
   2101 #else
   2102 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcle_f16(float16x4_t __p0, float16x4_t __p1) {
   2103   uint16x4_t __ret;
   2104   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2105   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2106   __ret = (uint16x4_t)(__rev0 <= __rev1);
   2107   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2108   return __ret;
   2109 }
   2110 #endif
   2111 
   2112 #ifdef __LITTLE_ENDIAN__
   2113 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vclezq_f16(float16x8_t __p0) {
   2114   uint16x8_t __ret;
   2115   __ret = (uint16x8_t) __builtin_neon_vclezq_f16((int8x16_t)__p0, 49);
   2116   return __ret;
   2117 }
   2118 #else
   2119 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vclezq_f16(float16x8_t __p0) {
   2120   uint16x8_t __ret;
   2121   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2122   __ret = (uint16x8_t) __builtin_neon_vclezq_f16((int8x16_t)__rev0, 49);
   2123   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2124   return __ret;
   2125 }
   2126 #endif
   2127 
   2128 #ifdef __LITTLE_ENDIAN__
   2129 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclez_f16(float16x4_t __p0) {
   2130   uint16x4_t __ret;
   2131   __ret = (uint16x4_t) __builtin_neon_vclez_f16((int8x8_t)__p0, 17);
   2132   return __ret;
   2133 }
   2134 #else
   2135 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclez_f16(float16x4_t __p0) {
   2136   uint16x4_t __ret;
   2137   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2138   __ret = (uint16x4_t) __builtin_neon_vclez_f16((int8x8_t)__rev0, 17);
   2139   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2140   return __ret;
   2141 }
   2142 #endif
   2143 
   2144 #ifdef __LITTLE_ENDIAN__
   2145 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltq_f16(float16x8_t __p0, float16x8_t __p1) {
   2146   uint16x8_t __ret;
   2147   __ret = (uint16x8_t)(__p0 < __p1);
   2148   return __ret;
   2149 }
   2150 #else
   2151 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltq_f16(float16x8_t __p0, float16x8_t __p1) {
   2152   uint16x8_t __ret;
   2153   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2154   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2155   __ret = (uint16x8_t)(__rev0 < __rev1);
   2156   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2157   return __ret;
   2158 }
   2159 #endif
   2160 
   2161 #ifdef __LITTLE_ENDIAN__
   2162 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclt_f16(float16x4_t __p0, float16x4_t __p1) {
   2163   uint16x4_t __ret;
   2164   __ret = (uint16x4_t)(__p0 < __p1);
   2165   return __ret;
   2166 }
   2167 #else
   2168 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclt_f16(float16x4_t __p0, float16x4_t __p1) {
   2169   uint16x4_t __ret;
   2170   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2171   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2172   __ret = (uint16x4_t)(__rev0 < __rev1);
   2173   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2174   return __ret;
   2175 }
   2176 #endif
   2177 
   2178 #ifdef __LITTLE_ENDIAN__
   2179 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltzq_f16(float16x8_t __p0) {
   2180   uint16x8_t __ret;
   2181   __ret = (uint16x8_t) __builtin_neon_vcltzq_f16((int8x16_t)__p0, 49);
   2182   return __ret;
   2183 }
   2184 #else
   2185 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltzq_f16(float16x8_t __p0) {
   2186   uint16x8_t __ret;
   2187   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2188   __ret = (uint16x8_t) __builtin_neon_vcltzq_f16((int8x16_t)__rev0, 49);
   2189   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2190   return __ret;
   2191 }
   2192 #endif
   2193 
   2194 #ifdef __LITTLE_ENDIAN__
   2195 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcltz_f16(float16x4_t __p0) {
   2196   uint16x4_t __ret;
   2197   __ret = (uint16x4_t) __builtin_neon_vcltz_f16((int8x8_t)__p0, 17);
   2198   return __ret;
   2199 }
   2200 #else
   2201 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcltz_f16(float16x4_t __p0) {
   2202   uint16x4_t __ret;
   2203   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2204   __ret = (uint16x4_t) __builtin_neon_vcltz_f16((int8x8_t)__rev0, 17);
   2205   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2206   return __ret;
   2207 }
   2208 #endif
   2209 
   2210 #ifdef __LITTLE_ENDIAN__
   2211 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_u16(uint16x8_t __p0) {
   2212   float16x8_t __ret;
   2213   __ret = (float16x8_t) __builtin_neon_vcvtq_f16_u16((int8x16_t)__p0, 49);
   2214   return __ret;
   2215 }
   2216 #else
   2217 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_u16(uint16x8_t __p0) {
   2218   float16x8_t __ret;
   2219   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2220   __ret = (float16x8_t) __builtin_neon_vcvtq_f16_u16((int8x16_t)__rev0, 49);
   2221   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2222   return __ret;
   2223 }
   2224 #endif
   2225 
   2226 #ifdef __LITTLE_ENDIAN__
   2227 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_s16(int16x8_t __p0) {
   2228   float16x8_t __ret;
   2229   __ret = (float16x8_t) __builtin_neon_vcvtq_f16_s16((int8x16_t)__p0, 33);
   2230   return __ret;
   2231 }
   2232 #else
   2233 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_s16(int16x8_t __p0) {
   2234   float16x8_t __ret;
   2235   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2236   __ret = (float16x8_t) __builtin_neon_vcvtq_f16_s16((int8x16_t)__rev0, 33);
   2237   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2238   return __ret;
   2239 }
   2240 #endif
   2241 
   2242 #ifdef __LITTLE_ENDIAN__
   2243 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_u16(uint16x4_t __p0) {
   2244   float16x4_t __ret;
   2245   __ret = (float16x4_t) __builtin_neon_vcvt_f16_u16((int8x8_t)__p0, 17);
   2246   return __ret;
   2247 }
   2248 #else
   2249 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_u16(uint16x4_t __p0) {
   2250   float16x4_t __ret;
   2251   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2252   __ret = (float16x4_t) __builtin_neon_vcvt_f16_u16((int8x8_t)__rev0, 17);
   2253   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2254   return __ret;
   2255 }
   2256 #endif
   2257 
   2258 #ifdef __LITTLE_ENDIAN__
   2259 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_s16(int16x4_t __p0) {
   2260   float16x4_t __ret;
   2261   __ret = (float16x4_t) __builtin_neon_vcvt_f16_s16((int8x8_t)__p0, 1);
   2262   return __ret;
   2263 }
   2264 #else
   2265 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_s16(int16x4_t __p0) {
   2266   float16x4_t __ret;
   2267   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2268   __ret = (float16x4_t) __builtin_neon_vcvt_f16_s16((int8x8_t)__rev0, 1);
   2269   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2270   return __ret;
   2271 }
   2272 #endif
   2273 
   /* vcvtq_n_f16_u16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a uint16x8_t local, then passed (cast to int8x16_t) together with
    * __p1 and the constant 49 to __builtin_neon_vcvtq_n_f16_u16; the macro's
    * value is that result cast to float16x8_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvtq_n_f16_u16(__p0, __p1) __extension__ ({ \
     uint16x8_t __arg0 = __p0; \
     float16x8_t __res = (float16x8_t) __builtin_neon_vcvtq_n_f16_u16((int8x16_t)__arg0, __p1, 49); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvtq_n_f16_u16(__p0, __p1) __extension__ ({ \
     uint16x8_t __arg0 = __p0; \
     uint16x8_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 7, 6, 5, 4, 3, 2, 1, 0); \
     float16x8_t __res = (float16x8_t) __builtin_neon_vcvtq_n_f16_u16((int8x16_t)__swp0, __p1, 49); \
     __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2291 
   /* vcvtq_n_f16_s16(__p0, __p1): statement-expression macro. __p0 is copied
    * into an int16x8_t local, then passed (cast to int8x16_t) together with
    * __p1 and the constant 33 to __builtin_neon_vcvtq_n_f16_s16; the macro's
    * value is that result cast to float16x8_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvtq_n_f16_s16(__p0, __p1) __extension__ ({ \
     int16x8_t __arg0 = __p0; \
     float16x8_t __res = (float16x8_t) __builtin_neon_vcvtq_n_f16_s16((int8x16_t)__arg0, __p1, 33); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvtq_n_f16_s16(__p0, __p1) __extension__ ({ \
     int16x8_t __arg0 = __p0; \
     int16x8_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 7, 6, 5, 4, 3, 2, 1, 0); \
     float16x8_t __res = (float16x8_t) __builtin_neon_vcvtq_n_f16_s16((int8x16_t)__swp0, __p1, 33); \
     __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2309 
   /* vcvt_n_f16_u16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a uint16x4_t local, then passed (cast to int8x8_t) together with
    * __p1 and the constant 17 to __builtin_neon_vcvt_n_f16_u16; the macro's
    * value is that result cast to float16x4_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvt_n_f16_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __arg0 = __p0; \
     float16x4_t __res = (float16x4_t) __builtin_neon_vcvt_n_f16_u16((int8x8_t)__arg0, __p1, 17); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvt_n_f16_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __arg0 = __p0; \
     uint16x4_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 3, 2, 1, 0); \
     float16x4_t __res = (float16x4_t) __builtin_neon_vcvt_n_f16_u16((int8x8_t)__swp0, __p1, 17); \
     __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2327 
   /* vcvt_n_f16_s16(__p0, __p1): statement-expression macro. __p0 is copied
    * into an int16x4_t local, then passed (cast to int8x8_t) together with
    * __p1 and the constant 1 to __builtin_neon_vcvt_n_f16_s16; the macro's
    * value is that result cast to float16x4_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvt_n_f16_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __arg0 = __p0; \
     float16x4_t __res = (float16x4_t) __builtin_neon_vcvt_n_f16_s16((int8x8_t)__arg0, __p1, 1); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvt_n_f16_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __arg0 = __p0; \
     int16x4_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 3, 2, 1, 0); \
     float16x4_t __res = (float16x4_t) __builtin_neon_vcvt_n_f16_s16((int8x8_t)__swp0, __p1, 1); \
     __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2345 
   /* vcvtq_n_s16_f16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a float16x8_t local, then passed (cast to int8x16_t) together with
    * __p1 and the constant 33 to __builtin_neon_vcvtq_n_s16_f16; the macro's
    * value is that result cast to int16x8_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvtq_n_s16_f16(__p0, __p1) __extension__ ({ \
     float16x8_t __arg0 = __p0; \
     int16x8_t __res = (int16x8_t) __builtin_neon_vcvtq_n_s16_f16((int8x16_t)__arg0, __p1, 33); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvtq_n_s16_f16(__p0, __p1) __extension__ ({ \
     float16x8_t __arg0 = __p0; \
     float16x8_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 7, 6, 5, 4, 3, 2, 1, 0); \
     int16x8_t __res = (int16x8_t) __builtin_neon_vcvtq_n_s16_f16((int8x16_t)__swp0, __p1, 33); \
     __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2363 
   /* vcvt_n_s16_f16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a float16x4_t local, then passed (cast to int8x8_t) together with
    * __p1 and the constant 1 to __builtin_neon_vcvt_n_s16_f16; the macro's
    * value is that result cast to int16x4_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvt_n_s16_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __arg0 = __p0; \
     int16x4_t __res = (int16x4_t) __builtin_neon_vcvt_n_s16_f16((int8x8_t)__arg0, __p1, 1); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvt_n_s16_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __arg0 = __p0; \
     float16x4_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 3, 2, 1, 0); \
     int16x4_t __res = (int16x4_t) __builtin_neon_vcvt_n_s16_f16((int8x8_t)__swp0, __p1, 1); \
     __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2381 
   /* vcvtq_n_u16_f16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a float16x8_t local, then passed (cast to int8x16_t) together with
    * __p1 and the constant 49 to __builtin_neon_vcvtq_n_u16_f16; the macro's
    * value is that result cast to uint16x8_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvtq_n_u16_f16(__p0, __p1) __extension__ ({ \
     float16x8_t __arg0 = __p0; \
     uint16x8_t __res = (uint16x8_t) __builtin_neon_vcvtq_n_u16_f16((int8x16_t)__arg0, __p1, 49); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvtq_n_u16_f16(__p0, __p1) __extension__ ({ \
     float16x8_t __arg0 = __p0; \
     float16x8_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 7, 6, 5, 4, 3, 2, 1, 0); \
     uint16x8_t __res = (uint16x8_t) __builtin_neon_vcvtq_n_u16_f16((int8x16_t)__swp0, __p1, 49); \
     __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2399 
   /* vcvt_n_u16_f16(__p0, __p1): statement-expression macro. __p0 is copied
    * into a float16x4_t local, then passed (cast to int8x8_t) together with
    * __p1 and the constant 17 to __builtin_neon_vcvt_n_u16_f16; the macro's
    * value is that result cast to uint16x4_t. */
   #ifdef __LITTLE_ENDIAN__
   #define vcvt_n_u16_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __arg0 = __p0; \
     uint16x4_t __res = (uint16x4_t) __builtin_neon_vcvt_n_u16_f16((int8x8_t)__arg0, __p1, 17); \
     __res; \
   })
   #else
   /* Big-endian build: the copied operand is lane-reversed before the builtin
    * call and the result is lane-reversed afterwards. */
   #define vcvt_n_u16_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __arg0 = __p0; \
     float16x4_t __swp0 = __builtin_shufflevector(__arg0, __arg0, 3, 2, 1, 0); \
     uint16x4_t __res = (uint16x4_t) __builtin_neon_vcvt_n_u16_f16((int8x8_t)__swp0, __p1, 17); \
     __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
     __res; \
   })
   #endif
   2417 
   2418 #ifdef __LITTLE_ENDIAN__
   2419 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtq_s16_f16(float16x8_t __p0) {
   2420   int16x8_t __ret;
   2421   __ret = (int16x8_t) __builtin_neon_vcvtq_s16_f16((int8x16_t)__p0, 33);
   2422   return __ret;
   2423 }
   2424 #else
   2425 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtq_s16_f16(float16x8_t __p0) {
   2426   int16x8_t __ret;
   2427   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2428   __ret = (int16x8_t) __builtin_neon_vcvtq_s16_f16((int8x16_t)__rev0, 33);
   2429   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2430   return __ret;
   2431 }
   2432 #endif
   2433 
   2434 #ifdef __LITTLE_ENDIAN__
   2435 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvt_s16_f16(float16x4_t __p0) {
   2436   int16x4_t __ret;
   2437   __ret = (int16x4_t) __builtin_neon_vcvt_s16_f16((int8x8_t)__p0, 1);
   2438   return __ret;
   2439 }
   2440 #else
   2441 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvt_s16_f16(float16x4_t __p0) {
   2442   int16x4_t __ret;
   2443   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2444   __ret = (int16x4_t) __builtin_neon_vcvt_s16_f16((int8x8_t)__rev0, 1);
   2445   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2446   return __ret;
   2447 }
   2448 #endif
   2449 
   2450 #ifdef __LITTLE_ENDIAN__
   2451 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtq_u16_f16(float16x8_t __p0) {
   2452   uint16x8_t __ret;
   2453   __ret = (uint16x8_t) __builtin_neon_vcvtq_u16_f16((int8x16_t)__p0, 49);
   2454   return __ret;
   2455 }
   2456 #else
   2457 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtq_u16_f16(float16x8_t __p0) {
   2458   uint16x8_t __ret;
   2459   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2460   __ret = (uint16x8_t) __builtin_neon_vcvtq_u16_f16((int8x16_t)__rev0, 49);
   2461   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2462   return __ret;
   2463 }
   2464 #endif
   2465 
   2466 #ifdef __LITTLE_ENDIAN__
   2467 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvt_u16_f16(float16x4_t __p0) {
   2468   uint16x4_t __ret;
   2469   __ret = (uint16x4_t) __builtin_neon_vcvt_u16_f16((int8x8_t)__p0, 17);
   2470   return __ret;
   2471 }
   2472 #else
   2473 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvt_u16_f16(float16x4_t __p0) {
   2474   uint16x4_t __ret;
   2475   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2476   __ret = (uint16x4_t) __builtin_neon_vcvt_u16_f16((int8x8_t)__rev0, 17);
   2477   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2478   return __ret;
   2479 }
   2480 #endif
   2481 
   2482 #ifdef __LITTLE_ENDIAN__
   2483 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtaq_s16_f16(float16x8_t __p0) {
   2484   int16x8_t __ret;
   2485   __ret = (int16x8_t) __builtin_neon_vcvtaq_s16_f16((int8x16_t)__p0, 33);
   2486   return __ret;
   2487 }
   2488 #else
   2489 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtaq_s16_f16(float16x8_t __p0) {
   2490   int16x8_t __ret;
   2491   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2492   __ret = (int16x8_t) __builtin_neon_vcvtaq_s16_f16((int8x16_t)__rev0, 33);
   2493   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2494   return __ret;
   2495 }
   2496 #endif
   2497 
   2498 #ifdef __LITTLE_ENDIAN__
   2499 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvta_s16_f16(float16x4_t __p0) {
   2500   int16x4_t __ret;
   2501   __ret = (int16x4_t) __builtin_neon_vcvta_s16_f16((int8x8_t)__p0, 1);
   2502   return __ret;
   2503 }
   2504 #else
   2505 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvta_s16_f16(float16x4_t __p0) {
   2506   int16x4_t __ret;
   2507   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2508   __ret = (int16x4_t) __builtin_neon_vcvta_s16_f16((int8x8_t)__rev0, 1);
   2509   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2510   return __ret;
   2511 }
   2512 #endif
   2513 
   2514 #ifdef __LITTLE_ENDIAN__
   2515 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtaq_u16_f16(float16x8_t __p0) {
   2516   uint16x8_t __ret;
   2517   __ret = (uint16x8_t) __builtin_neon_vcvtaq_u16_f16((int8x16_t)__p0, 49);
   2518   return __ret;
   2519 }
   2520 #else
   2521 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtaq_u16_f16(float16x8_t __p0) {
   2522   uint16x8_t __ret;
   2523   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2524   __ret = (uint16x8_t) __builtin_neon_vcvtaq_u16_f16((int8x16_t)__rev0, 49);
   2525   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2526   return __ret;
   2527 }
   2528 #endif
   2529 
   2530 #ifdef __LITTLE_ENDIAN__
   2531 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvta_u16_f16(float16x4_t __p0) {
   2532   uint16x4_t __ret;
   2533   __ret = (uint16x4_t) __builtin_neon_vcvta_u16_f16((int8x8_t)__p0, 17);
   2534   return __ret;
   2535 }
   2536 #else
   2537 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvta_u16_f16(float16x4_t __p0) {
   2538   uint16x4_t __ret;
   2539   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2540   __ret = (uint16x4_t) __builtin_neon_vcvta_u16_f16((int8x8_t)__rev0, 17);
   2541   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2542   return __ret;
   2543 }
   2544 #endif
   2545 
   2546 #ifdef __LITTLE_ENDIAN__
   2547 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtmq_s16_f16(float16x8_t __p0) {
   2548   int16x8_t __ret;
   2549   __ret = (int16x8_t) __builtin_neon_vcvtmq_s16_f16((int8x16_t)__p0, 33);
   2550   return __ret;
   2551 }
   2552 #else
   2553 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtmq_s16_f16(float16x8_t __p0) {
   2554   int16x8_t __ret;
   2555   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2556   __ret = (int16x8_t) __builtin_neon_vcvtmq_s16_f16((int8x16_t)__rev0, 33);
   2557   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2558   return __ret;
   2559 }
   2560 #endif
   2561 
   2562 #ifdef __LITTLE_ENDIAN__
   2563 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtm_s16_f16(float16x4_t __p0) {
   2564   int16x4_t __ret;
   2565   __ret = (int16x4_t) __builtin_neon_vcvtm_s16_f16((int8x8_t)__p0, 1);
   2566   return __ret;
   2567 }
   2568 #else
   2569 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtm_s16_f16(float16x4_t __p0) {
   2570   int16x4_t __ret;
   2571   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2572   __ret = (int16x4_t) __builtin_neon_vcvtm_s16_f16((int8x8_t)__rev0, 1);
   2573   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2574   return __ret;
   2575 }
   2576 #endif
   2577 
   2578 #ifdef __LITTLE_ENDIAN__
   2579 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtmq_u16_f16(float16x8_t __p0) {
   2580   uint16x8_t __ret;
   2581   __ret = (uint16x8_t) __builtin_neon_vcvtmq_u16_f16((int8x16_t)__p0, 49);
   2582   return __ret;
   2583 }
   2584 #else
   2585 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtmq_u16_f16(float16x8_t __p0) {
   2586   uint16x8_t __ret;
   2587   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2588   __ret = (uint16x8_t) __builtin_neon_vcvtmq_u16_f16((int8x16_t)__rev0, 49);
   2589   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2590   return __ret;
   2591 }
   2592 #endif
   2593 
   2594 #ifdef __LITTLE_ENDIAN__
   2595 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtm_u16_f16(float16x4_t __p0) {
   2596   uint16x4_t __ret;
   2597   __ret = (uint16x4_t) __builtin_neon_vcvtm_u16_f16((int8x8_t)__p0, 17);
   2598   return __ret;
   2599 }
   2600 #else
   2601 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtm_u16_f16(float16x4_t __p0) {
   2602   uint16x4_t __ret;
   2603   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2604   __ret = (uint16x4_t) __builtin_neon_vcvtm_u16_f16((int8x8_t)__rev0, 17);
   2605   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2606   return __ret;
   2607 }
   2608 #endif
   2609 
   2610 #ifdef __LITTLE_ENDIAN__
   2611 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtnq_s16_f16(float16x8_t __p0) {
   2612   int16x8_t __ret;
   2613   __ret = (int16x8_t) __builtin_neon_vcvtnq_s16_f16((int8x16_t)__p0, 33);
   2614   return __ret;
   2615 }
   2616 #else
   2617 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtnq_s16_f16(float16x8_t __p0) {
   2618   int16x8_t __ret;
   2619   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2620   __ret = (int16x8_t) __builtin_neon_vcvtnq_s16_f16((int8x16_t)__rev0, 33);
   2621   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2622   return __ret;
   2623 }
   2624 #endif
   2625 
   2626 #ifdef __LITTLE_ENDIAN__
   2627 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtn_s16_f16(float16x4_t __p0) {
   2628   int16x4_t __ret;
   2629   __ret = (int16x4_t) __builtin_neon_vcvtn_s16_f16((int8x8_t)__p0, 1);
   2630   return __ret;
   2631 }
   2632 #else
   2633 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtn_s16_f16(float16x4_t __p0) {
   2634   int16x4_t __ret;
   2635   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2636   __ret = (int16x4_t) __builtin_neon_vcvtn_s16_f16((int8x8_t)__rev0, 1);
   2637   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2638   return __ret;
   2639 }
   2640 #endif
   2641 
   2642 #ifdef __LITTLE_ENDIAN__
   2643 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtnq_u16_f16(float16x8_t __p0) {
   2644   uint16x8_t __ret;
   2645   __ret = (uint16x8_t) __builtin_neon_vcvtnq_u16_f16((int8x16_t)__p0, 49);
   2646   return __ret;
   2647 }
   2648 #else
   2649 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtnq_u16_f16(float16x8_t __p0) {
   2650   uint16x8_t __ret;
   2651   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2652   __ret = (uint16x8_t) __builtin_neon_vcvtnq_u16_f16((int8x16_t)__rev0, 49);
   2653   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2654   return __ret;
   2655 }
   2656 #endif
   2657 
   2658 #ifdef __LITTLE_ENDIAN__
   2659 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtn_u16_f16(float16x4_t __p0) {
   2660   uint16x4_t __ret;
   2661   __ret = (uint16x4_t) __builtin_neon_vcvtn_u16_f16((int8x8_t)__p0, 17);
   2662   return __ret;
   2663 }
   2664 #else
   2665 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtn_u16_f16(float16x4_t __p0) {
   2666   uint16x4_t __ret;
   2667   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2668   __ret = (uint16x4_t) __builtin_neon_vcvtn_u16_f16((int8x8_t)__rev0, 17);
   2669   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2670   return __ret;
   2671 }
   2672 #endif
   2673 
   2674 #ifdef __LITTLE_ENDIAN__
   2675 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtpq_s16_f16(float16x8_t __p0) {
   2676   int16x8_t __ret;
   2677   __ret = (int16x8_t) __builtin_neon_vcvtpq_s16_f16((int8x16_t)__p0, 33);
   2678   return __ret;
   2679 }
   2680 #else
   2681 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtpq_s16_f16(float16x8_t __p0) {
   2682   int16x8_t __ret;
   2683   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2684   __ret = (int16x8_t) __builtin_neon_vcvtpq_s16_f16((int8x16_t)__rev0, 33);
   2685   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2686   return __ret;
   2687 }
   2688 #endif
   2689 
   2690 #ifdef __LITTLE_ENDIAN__
   2691 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtp_s16_f16(float16x4_t __p0) {
   2692   int16x4_t __ret;
   2693   __ret = (int16x4_t) __builtin_neon_vcvtp_s16_f16((int8x8_t)__p0, 1);
   2694   return __ret;
   2695 }
   2696 #else
   2697 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtp_s16_f16(float16x4_t __p0) {
   2698   int16x4_t __ret;
   2699   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2700   __ret = (int16x4_t) __builtin_neon_vcvtp_s16_f16((int8x8_t)__rev0, 1);
   2701   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2702   return __ret;
   2703 }
   2704 #endif
   2705 
   2706 #ifdef __LITTLE_ENDIAN__
   2707 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtpq_u16_f16(float16x8_t __p0) {
   2708   uint16x8_t __ret;
   2709   __ret = (uint16x8_t) __builtin_neon_vcvtpq_u16_f16((int8x16_t)__p0, 49);
   2710   return __ret;
   2711 }
   2712 #else
   2713 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtpq_u16_f16(float16x8_t __p0) {
   2714   uint16x8_t __ret;
   2715   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2716   __ret = (uint16x8_t) __builtin_neon_vcvtpq_u16_f16((int8x16_t)__rev0, 49);
   2717   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2718   return __ret;
   2719 }
   2720 #endif
   2721 
   2722 #ifdef __LITTLE_ENDIAN__
   2723 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtp_u16_f16(float16x4_t __p0) {
   2724   uint16x4_t __ret;
   2725   __ret = (uint16x4_t) __builtin_neon_vcvtp_u16_f16((int8x8_t)__p0, 17);
   2726   return __ret;
   2727 }
   2728 #else
   2729 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtp_u16_f16(float16x4_t __p0) {
   2730   uint16x4_t __ret;
   2731   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2732   __ret = (uint16x4_t) __builtin_neon_vcvtp_u16_f16((int8x8_t)__rev0, 17);
   2733   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2734   return __ret;
   2735 }
   2736 #endif
   2737 
   2738 #ifdef __LITTLE_ENDIAN__
        /*
         * vfmaq_f16: three-operand float16x8_t wrapper around
         * __builtin_neon_vfmaq_f16 (presumably a fused multiply-add, judging by the
         * name; the builtin itself is not defined in this file).
         * With __LITTLE_ENDIAN__ defined the operands are cast to int8x16_t and
         * forwarded unchanged.
         */
   2739 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   2740   float16x8_t __ret;
   2741   __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
   2742   return __ret;
   2743 }
   2744 #else
        /*
         * Without __LITTLE_ENDIAN__: every operand has its 8 lanes reversed before
         * the builtin call, and the result's lanes are reversed again afterwards.
         */
   2745 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   2746   float16x8_t __ret;
   2747   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2748   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2749   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   2750   __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
   2751   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2752   return __ret;
   2753 }
        /*
         * __noswap_vfmaq_f16: same builtin call with no lane reversal, for callers
         * that have already reversed their operands (vfmsq_f16 in this file is one).
         */
   2754 __ai __attribute__((target("fullfp16,neon"))) float16x8_t __noswap_vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   2755   float16x8_t __ret;
   2756   __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
   2757   return __ret;
   2758 }
   2759 #endif
   2760 
   2761 #ifdef __LITTLE_ENDIAN__
        /*
         * vfma_f16: three-operand float16x4_t wrapper around
         * __builtin_neon_vfma_f16 (presumably a fused multiply-add, judging by the
         * name; the builtin itself is not defined in this file).
         * With __LITTLE_ENDIAN__ defined the operands are cast to int8x8_t and
         * forwarded unchanged.
         */
   2762 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   2763   float16x4_t __ret;
   2764   __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
   2765   return __ret;
   2766 }
   2767 #else
        /*
         * Without __LITTLE_ENDIAN__: every operand has its 4 lanes reversed before
         * the builtin call, and the result's lanes are reversed again afterwards.
         */
   2768 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   2769   float16x4_t __ret;
   2770   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2771   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2772   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   2773   __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
   2774   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2775   return __ret;
   2776 }
        /*
         * __noswap_vfma_f16: same builtin call with no lane reversal, for callers
         * that have already reversed their operands (vfms_f16 in this file is one).
         */
   2777 __ai __attribute__((target("fullfp16,neon"))) float16x4_t __noswap_vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   2778   float16x4_t __ret;
   2779   __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
   2780   return __ret;
   2781 }
   2782 #endif
   2783 
   2784 #ifdef __LITTLE_ENDIAN__
        /*
         * vfmsq_f16: implemented on top of vfmaq_f16 by negating the second
         * operand, i.e. it returns vfmaq_f16(__p0, -__p1, __p2).
         */
   2785 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmsq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   2786   float16x8_t __ret;
   2787   __ret = vfmaq_f16(__p0, -__p1, __p2);
   2788   return __ret;
   2789 }
   2790 #else
        /*
         * Without __LITTLE_ENDIAN__: the operands are lane-reversed here, so the
         * call goes to __noswap_vfmaq_f16 (which performs no reversal of its own)
         * rather than vfmaq_f16; the result is reversed once before returning.
         */
   2791 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmsq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   2792   float16x8_t __ret;
   2793   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2794   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2795   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   2796   __ret = __noswap_vfmaq_f16(__rev0, -__rev1, __rev2);
   2797   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2798   return __ret;
   2799 }
   2800 #endif
   2801 
   2802 #ifdef __LITTLE_ENDIAN__
        /*
         * vfms_f16: implemented on top of vfma_f16 by negating the second
         * operand, i.e. it returns vfma_f16(__p0, -__p1, __p2).
         */
   2803 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfms_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   2804   float16x4_t __ret;
   2805   __ret = vfma_f16(__p0, -__p1, __p2);
   2806   return __ret;
   2807 }
   2808 #else
        /*
         * Without __LITTLE_ENDIAN__: the operands are lane-reversed here, so the
         * call goes to __noswap_vfma_f16 (which performs no reversal of its own)
         * rather than vfma_f16; the result is reversed once before returning.
         */
   2809 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfms_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   2810   float16x4_t __ret;
   2811   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2812   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2813   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   2814   __ret = __noswap_vfma_f16(__rev0, -__rev1, __rev2);
   2815   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2816   return __ret;
   2817 }
   2818 #endif
   2819 
   2820 #ifdef __LITTLE_ENDIAN__
        /*
         * vmaxq_f16: two-operand float16x8_t wrapper around
         * __builtin_neon_vmaxq_f16 (presumably a lane-wise maximum, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   2821 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxq_f16(float16x8_t __p0, float16x8_t __p1) {
   2822   float16x8_t __ret;
   2823   __ret = (float16x8_t) __builtin_neon_vmaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
   2824   return __ret;
   2825 }
   2826 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   2827 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxq_f16(float16x8_t __p0, float16x8_t __p1) {
   2828   float16x8_t __ret;
   2829   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2830   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2831   __ret = (float16x8_t) __builtin_neon_vmaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
   2832   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2833   return __ret;
   2834 }
   2835 #endif
   2836 
   2837 #ifdef __LITTLE_ENDIAN__
        /*
         * vmax_f16: two-operand float16x4_t wrapper around __builtin_neon_vmax_f16
         * (presumably a lane-wise maximum, judging by the name).
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   2838 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmax_f16(float16x4_t __p0, float16x4_t __p1) {
   2839   float16x4_t __ret;
   2840   __ret = (float16x4_t) __builtin_neon_vmax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   2841   return __ret;
   2842 }
   2843 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   2844 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmax_f16(float16x4_t __p0, float16x4_t __p1) {
   2845   float16x4_t __ret;
   2846   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2847   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2848   __ret = (float16x4_t) __builtin_neon_vmax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   2849   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2850   return __ret;
   2851 }
   2852 #endif
   2853 
   2854 #ifdef __LITTLE_ENDIAN__
        /*
         * vminq_f16: two-operand float16x8_t wrapper around
         * __builtin_neon_vminq_f16 (presumably a lane-wise minimum, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   2855 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminq_f16(float16x8_t __p0, float16x8_t __p1) {
   2856   float16x8_t __ret;
   2857   __ret = (float16x8_t) __builtin_neon_vminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
   2858   return __ret;
   2859 }
   2860 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   2861 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminq_f16(float16x8_t __p0, float16x8_t __p1) {
   2862   float16x8_t __ret;
   2863   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2864   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2865   __ret = (float16x8_t) __builtin_neon_vminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
   2866   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2867   return __ret;
   2868 }
   2869 #endif
   2870 
   2871 #ifdef __LITTLE_ENDIAN__
        /*
         * vmin_f16: two-operand float16x4_t wrapper around __builtin_neon_vmin_f16
         * (presumably a lane-wise minimum, judging by the name).
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   2872 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmin_f16(float16x4_t __p0, float16x4_t __p1) {
   2873   float16x4_t __ret;
   2874   __ret = (float16x4_t) __builtin_neon_vmin_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   2875   return __ret;
   2876 }
   2877 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   2878 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmin_f16(float16x4_t __p0, float16x4_t __p1) {
   2879   float16x4_t __ret;
   2880   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2881   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2882   __ret = (float16x4_t) __builtin_neon_vmin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   2883   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2884   return __ret;
   2885 }
   2886 #endif
   2887 
   2888 #ifdef __LITTLE_ENDIAN__
        /*
         * vmulq_f16: returns the product of two float16x8_t vectors, computed with
         * the `*` operator applied directly to the vector operands (no builtin call).
         */
   2889 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulq_f16(float16x8_t __p0, float16x8_t __p1) {
   2890   float16x8_t __ret;
   2891   __ret = __p0 * __p1;
   2892   return __ret;
   2893 }
   2894 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed, multiplied,
         * and the product is lane-reversed again before returning.
         */
   2895 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulq_f16(float16x8_t __p0, float16x8_t __p1) {
   2896   float16x8_t __ret;
   2897   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2898   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   2899   __ret = __rev0 * __rev1;
   2900   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2901   return __ret;
   2902 }
   2903 #endif
   2904 
   2905 #ifdef __LITTLE_ENDIAN__
        /*
         * vmul_f16: returns the product of two float16x4_t vectors, computed with
         * the `*` operator applied directly to the vector operands (no builtin call).
         */
   2906 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmul_f16(float16x4_t __p0, float16x4_t __p1) {
   2907   float16x4_t __ret;
   2908   __ret = __p0 * __p1;
   2909   return __ret;
   2910 }
   2911 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed, multiplied,
         * and the product is lane-reversed again before returning.
         */
   2912 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmul_f16(float16x4_t __p0, float16x4_t __p1) {
   2913   float16x4_t __ret;
   2914   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2915   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   2916   __ret = __rev0 * __rev1;
   2917   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2918   return __ret;
   2919 }
   2920 #endif
   2921 
   2922 #ifdef __LITTLE_ENDIAN__
        /*
         * vmulq_n_f16(__p0, __p1): statement-expression macro that multiplies the
         * float16x8_t __p0 by a vector literal holding the float16_t __p1 in all
         * eight lanes. Each macro argument is expanded exactly once, into the
         * locals __s0 and __s1.
         */
   2923 #define vmulq_n_f16(__p0, __p1) __extension__ ({ \
   2924   float16x8_t __ret; \
   2925   float16x8_t __s0 = __p0; \
   2926   float16_t __s1 = __p1; \
   2927   __ret = __s0 * (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}; \
   2928   __ret; \
   2929 })
   2930 #else
        /*
         * Without __LITTLE_ENDIAN__: the vector operand is lane-reversed before the
         * multiply and the product is lane-reversed afterwards. The scalar is
         * broadcast as-is (all lanes hold the same value).
         */
   2931 #define vmulq_n_f16(__p0, __p1) __extension__ ({ \
   2932   float16x8_t __ret; \
   2933   float16x8_t __s0 = __p0; \
   2934   float16_t __s1 = __p1; \
   2935   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   2936   __ret = __rev0 * (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}; \
   2937   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   2938   __ret; \
   2939 })
   2940 #endif
   2941 
   2942 #ifdef __LITTLE_ENDIAN__
        /*
         * vmul_n_f16(__p0, __p1): statement-expression macro that multiplies the
         * float16x4_t __p0 by a vector literal holding the float16_t __p1 in all
         * four lanes. Each macro argument is expanded exactly once, into the
         * locals __s0 and __s1.
         */
   2943 #define vmul_n_f16(__p0, __p1) __extension__ ({ \
   2944   float16x4_t __ret; \
   2945   float16x4_t __s0 = __p0; \
   2946   float16_t __s1 = __p1; \
   2947   __ret = __s0 * (float16x4_t) {__s1, __s1, __s1, __s1}; \
   2948   __ret; \
   2949 })
   2950 #else
        /*
         * Without __LITTLE_ENDIAN__: the vector operand is lane-reversed before the
         * multiply and the product is lane-reversed afterwards. The scalar is
         * broadcast as-is (all lanes hold the same value).
         */
   2951 #define vmul_n_f16(__p0, __p1) __extension__ ({ \
   2952   float16x4_t __ret; \
   2953   float16x4_t __s0 = __p0; \
   2954   float16_t __s1 = __p1; \
   2955   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   2956   __ret = __rev0 * (float16x4_t) {__s1, __s1, __s1, __s1}; \
   2957   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   2958   __ret; \
   2959 })
   2960 #endif
   2961 
   2962 #ifdef __LITTLE_ENDIAN__
        /*
         * vnegq_f16: returns the float16x8_t operand with unary minus applied to
         * the whole vector (no builtin call).
         */
   2963 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vnegq_f16(float16x8_t __p0) {
   2964   float16x8_t __ret;
   2965   __ret = -__p0;
   2966   return __ret;
   2967 }
   2968 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed, negated, and the
         * result is lane-reversed again before returning.
         */
   2969 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vnegq_f16(float16x8_t __p0) {
   2970   float16x8_t __ret;
   2971   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   2972   __ret = -__rev0;
   2973   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   2974   return __ret;
   2975 }
   2976 #endif
   2977 
   2978 #ifdef __LITTLE_ENDIAN__
        /*
         * vneg_f16: returns the float16x4_t operand with unary minus applied to
         * the whole vector (no builtin call).
         */
   2979 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vneg_f16(float16x4_t __p0) {
   2980   float16x4_t __ret;
   2981   __ret = -__p0;
   2982   return __ret;
   2983 }
   2984 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed, negated, and the
         * result is lane-reversed again before returning.
         */
   2985 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vneg_f16(float16x4_t __p0) {
   2986   float16x4_t __ret;
   2987   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   2988   __ret = -__rev0;
   2989   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   2990   return __ret;
   2991 }
   2992 #endif
   2993 
   2994 #ifdef __LITTLE_ENDIAN__
        /*
         * vpadd_f16: two-operand float16x4_t wrapper around
         * __builtin_neon_vpadd_f16 (presumably a pairwise add, judging by the name).
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   2995 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpadd_f16(float16x4_t __p0, float16x4_t __p1) {
   2996   float16x4_t __ret;
   2997   __ret = (float16x4_t) __builtin_neon_vpadd_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   2998   return __ret;
   2999 }
   3000 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3001 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpadd_f16(float16x4_t __p0, float16x4_t __p1) {
   3002   float16x4_t __ret;
   3003   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3004   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3005   __ret = (float16x4_t) __builtin_neon_vpadd_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   3006   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3007   return __ret;
   3008 }
   3009 #endif
   3010 
   3011 #ifdef __LITTLE_ENDIAN__
        /*
         * vpmax_f16: two-operand float16x4_t wrapper around
         * __builtin_neon_vpmax_f16 (presumably a pairwise maximum, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3012 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmax_f16(float16x4_t __p0, float16x4_t __p1) {
   3013   float16x4_t __ret;
   3014   __ret = (float16x4_t) __builtin_neon_vpmax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   3015   return __ret;
   3016 }
   3017 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3018 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmax_f16(float16x4_t __p0, float16x4_t __p1) {
   3019   float16x4_t __ret;
   3020   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3021   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3022   __ret = (float16x4_t) __builtin_neon_vpmax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   3023   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3024   return __ret;
   3025 }
   3026 #endif
   3027 
   3028 #ifdef __LITTLE_ENDIAN__
        /*
         * vpmin_f16: two-operand float16x4_t wrapper around
         * __builtin_neon_vpmin_f16 (presumably a pairwise minimum, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3029 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmin_f16(float16x4_t __p0, float16x4_t __p1) {
   3030   float16x4_t __ret;
   3031   __ret = (float16x4_t) __builtin_neon_vpmin_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   3032   return __ret;
   3033 }
   3034 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3035 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmin_f16(float16x4_t __p0, float16x4_t __p1) {
   3036   float16x4_t __ret;
   3037   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3038   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3039   __ret = (float16x4_t) __builtin_neon_vpmin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   3040   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3041   return __ret;
   3042 }
   3043 #endif
   3044 
   3045 #ifdef __LITTLE_ENDIAN__
        /*
         * vrecpeq_f16: one-operand float16x8_t wrapper around
         * __builtin_neon_vrecpeq_f16 (presumably a reciprocal estimate, judging by
         * the name). With __LITTLE_ENDIAN__ defined the operand is forwarded
         * unchanged.
         */
   3046 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpeq_f16(float16x8_t __p0) {
   3047   float16x8_t __ret;
   3048   __ret = (float16x8_t) __builtin_neon_vrecpeq_f16((int8x16_t)__p0, 40);
   3049   return __ret;
   3050 }
   3051 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3052 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpeq_f16(float16x8_t __p0) {
   3053   float16x8_t __ret;
   3054   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   3055   __ret = (float16x8_t) __builtin_neon_vrecpeq_f16((int8x16_t)__rev0, 40);
   3056   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   3057   return __ret;
   3058 }
   3059 #endif
   3060 
   3061 #ifdef __LITTLE_ENDIAN__
        /*
         * vrecpe_f16: one-operand float16x4_t wrapper around
         * __builtin_neon_vrecpe_f16 (presumably a reciprocal estimate, judging by
         * the name). With __LITTLE_ENDIAN__ defined the operand is forwarded
         * unchanged.
         */
   3062 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecpe_f16(float16x4_t __p0) {
   3063   float16x4_t __ret;
   3064   __ret = (float16x4_t) __builtin_neon_vrecpe_f16((int8x8_t)__p0, 8);
   3065   return __ret;
   3066 }
   3067 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3068 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecpe_f16(float16x4_t __p0) {
   3069   float16x4_t __ret;
   3070   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3071   __ret = (float16x4_t) __builtin_neon_vrecpe_f16((int8x8_t)__rev0, 8);
   3072   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3073   return __ret;
   3074 }
   3075 #endif
   3076 
   3077 #ifdef __LITTLE_ENDIAN__
        /*
         * vrecpsq_f16: two-operand float16x8_t wrapper around
         * __builtin_neon_vrecpsq_f16 (presumably a reciprocal step, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3078 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpsq_f16(float16x8_t __p0, float16x8_t __p1) {
   3079   float16x8_t __ret;
   3080   __ret = (float16x8_t) __builtin_neon_vrecpsq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
   3081   return __ret;
   3082 }
   3083 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3084 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpsq_f16(float16x8_t __p0, float16x8_t __p1) {
   3085   float16x8_t __ret;
   3086   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   3087   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   3088   __ret = (float16x8_t) __builtin_neon_vrecpsq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
   3089   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   3090   return __ret;
   3091 }
   3092 #endif
   3093 
   3094 #ifdef __LITTLE_ENDIAN__
        /*
         * vrecps_f16: two-operand float16x4_t wrapper around
         * __builtin_neon_vrecps_f16 (presumably a reciprocal step, judging by the
         * name). With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3095 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecps_f16(float16x4_t __p0, float16x4_t __p1) {
   3096   float16x4_t __ret;
   3097   __ret = (float16x4_t) __builtin_neon_vrecps_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   3098   return __ret;
   3099 }
   3100 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3101 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecps_f16(float16x4_t __p0, float16x4_t __p1) {
   3102   float16x4_t __ret;
   3103   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3104   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3105   __ret = (float16x4_t) __builtin_neon_vrecps_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   3106   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3107   return __ret;
   3108 }
   3109 #endif
   3110 
   3111 #ifdef __LITTLE_ENDIAN__
        /*
         * vrsqrteq_f16: one-operand float16x8_t wrapper around
         * __builtin_neon_vrsqrteq_f16 (presumably a reciprocal square-root
         * estimate, judging by the name). With __LITTLE_ENDIAN__ defined the
         * operand is forwarded unchanged.
         */
   3112 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrteq_f16(float16x8_t __p0) {
   3113   float16x8_t __ret;
   3114   __ret = (float16x8_t) __builtin_neon_vrsqrteq_f16((int8x16_t)__p0, 40);
   3115   return __ret;
   3116 }
   3117 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3118 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrteq_f16(float16x8_t __p0) {
   3119   float16x8_t __ret;
   3120   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   3121   __ret = (float16x8_t) __builtin_neon_vrsqrteq_f16((int8x16_t)__rev0, 40);
   3122   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   3123   return __ret;
   3124 }
   3125 #endif
   3126 
   3127 #ifdef __LITTLE_ENDIAN__
        /*
         * vrsqrte_f16: one-operand float16x4_t wrapper around
         * __builtin_neon_vrsqrte_f16 (presumably a reciprocal square-root
         * estimate, judging by the name). With __LITTLE_ENDIAN__ defined the
         * operand is forwarded unchanged.
         */
   3128 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrte_f16(float16x4_t __p0) {
   3129   float16x4_t __ret;
   3130   __ret = (float16x4_t) __builtin_neon_vrsqrte_f16((int8x8_t)__p0, 8);
   3131   return __ret;
   3132 }
   3133 #else
        /*
         * Without __LITTLE_ENDIAN__: the operand is lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3134 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrte_f16(float16x4_t __p0) {
   3135   float16x4_t __ret;
   3136   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3137   __ret = (float16x4_t) __builtin_neon_vrsqrte_f16((int8x8_t)__rev0, 8);
   3138   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3139   return __ret;
   3140 }
   3141 #endif
   3142 
   3143 #ifdef __LITTLE_ENDIAN__
        /*
         * vrsqrtsq_f16: two-operand float16x8_t wrapper around
         * __builtin_neon_vrsqrtsq_f16 (presumably a reciprocal square-root step,
         * judging by the name). With __LITTLE_ENDIAN__ defined the operands are
         * forwarded unchanged.
         */
   3144 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrtsq_f16(float16x8_t __p0, float16x8_t __p1) {
   3145   float16x8_t __ret;
   3146   __ret = (float16x8_t) __builtin_neon_vrsqrtsq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
   3147   return __ret;
   3148 }
   3149 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3150 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrtsq_f16(float16x8_t __p0, float16x8_t __p1) {
   3151   float16x8_t __ret;
   3152   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   3153   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   3154   __ret = (float16x8_t) __builtin_neon_vrsqrtsq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
   3155   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   3156   return __ret;
   3157 }
   3158 #endif
   3159 
   3160 #ifdef __LITTLE_ENDIAN__
        /*
         * vrsqrts_f16: two-operand float16x4_t wrapper around
         * __builtin_neon_vrsqrts_f16 (presumably a reciprocal square-root step,
         * judging by the name). With __LITTLE_ENDIAN__ defined the operands are
         * forwarded unchanged.
         */
   3161 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrts_f16(float16x4_t __p0, float16x4_t __p1) {
   3162   float16x4_t __ret;
   3163   __ret = (float16x4_t) __builtin_neon_vrsqrts_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
   3164   return __ret;
   3165 }
   3166 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed before the
         * builtin call and the result is lane-reversed again afterwards.
         */
   3167 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrts_f16(float16x4_t __p0, float16x4_t __p1) {
   3168   float16x4_t __ret;
   3169   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3170   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3171   __ret = (float16x4_t) __builtin_neon_vrsqrts_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
   3172   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3173   return __ret;
   3174 }
   3175 #endif
   3176 
   3177 #ifdef __LITTLE_ENDIAN__
        /*
         * vsubq_f16: returns __p0 - __p1 for two float16x8_t vectors, computed with
         * the `-` operator applied directly to the vector operands (no builtin call).
         */
   3178 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsubq_f16(float16x8_t __p0, float16x8_t __p1) {
   3179   float16x8_t __ret;
   3180   __ret = __p0 - __p1;
   3181   return __ret;
   3182 }
   3183 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed, subtracted,
         * and the difference is lane-reversed again before returning.
         */
   3184 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsubq_f16(float16x8_t __p0, float16x8_t __p1) {
   3185   float16x8_t __ret;
   3186   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   3187   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   3188   __ret = __rev0 - __rev1;
   3189   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   3190   return __ret;
   3191 }
   3192 #endif
   3193 
   3194 #ifdef __LITTLE_ENDIAN__
        /*
         * vsub_f16: returns __p0 - __p1 for two float16x4_t vectors, computed with
         * the `-` operator applied directly to the vector operands (no builtin call).
         */
   3195 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsub_f16(float16x4_t __p0, float16x4_t __p1) {
   3196   float16x4_t __ret;
   3197   __ret = __p0 - __p1;
   3198   return __ret;
   3199 }
   3200 #else
        /*
         * Without __LITTLE_ENDIAN__: both operands are lane-reversed, subtracted,
         * and the difference is lane-reversed again before returning.
         */
   3201 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsub_f16(float16x4_t __p0, float16x4_t __p1) {
   3202   float16x4_t __ret;
   3203   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3204   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   3205   __ret = __rev0 - __rev1;
   3206   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3207   return __ret;
   3208 }
   3209 #endif
   3210 
   3211 #ifdef __LITTLE_ENDIAN__
        /*
         * vmmlaq_u32: wraps __builtin_neon_vmmlaq_u32 for a uint32x4_t first
         * operand and two uint8x16_t operands, returning uint32x4_t. Declared with
         * target("i8mm,neon"). (Presumably an 8-bit matrix multiply-accumulate,
         * judging by the name; the builtin is not defined in this file.)
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3212 __ai __attribute__((target("i8mm,neon"))) uint32x4_t vmmlaq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   3213   uint32x4_t __ret;
   3214   __ret = (uint32x4_t) __builtin_neon_vmmlaq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
   3215   return __ret;
   3216 }
   3217 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane first operand and the two 16-lane
         * byte operands are each lane-reversed before the builtin call; the 4-lane
         * result is lane-reversed again afterwards.
         */
   3218 __ai __attribute__((target("i8mm,neon"))) uint32x4_t vmmlaq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   3219   uint32x4_t __ret;
   3220   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3221   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3222   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3223   __ret = (uint32x4_t) __builtin_neon_vmmlaq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
   3224   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3225   return __ret;
   3226 }
   3227 #endif
   3228 
   3229 #ifdef __LITTLE_ENDIAN__
        /*
         * vmmlaq_s32: wraps __builtin_neon_vmmlaq_s32 for an int32x4_t first
         * operand and two int8x16_t operands, returning int32x4_t. Declared with
         * target("i8mm,neon"). (Presumably an 8-bit matrix multiply-accumulate,
         * judging by the name; the builtin is not defined in this file.)
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3230 __ai __attribute__((target("i8mm,neon"))) int32x4_t vmmlaq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
   3231   int32x4_t __ret;
   3232   __ret = (int32x4_t) __builtin_neon_vmmlaq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   3233   return __ret;
   3234 }
   3235 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane first operand and the two 16-lane
         * byte operands are each lane-reversed before the builtin call; the 4-lane
         * result is lane-reversed again afterwards.
         */
   3236 __ai __attribute__((target("i8mm,neon"))) int32x4_t vmmlaq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
   3237   int32x4_t __ret;
   3238   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3239   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3240   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3241   __ret = (int32x4_t) __builtin_neon_vmmlaq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
   3242   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3243   return __ret;
   3244 }
   3245 #endif
   3246 
   3247 #ifdef __LITTLE_ENDIAN__
        /*
         * vusdotq_s32: wraps __builtin_neon_vusdotq_s32 for an int32x4_t first
         * operand, a uint8x16_t second operand and an int8x16_t third operand,
         * returning int32x4_t. Declared with target("i8mm,neon"). (Presumably a
         * mixed-sign dot product with accumulate, judging by the name.)
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3248 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) {
   3249   int32x4_t __ret;
   3250   __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   3251   return __ret;
   3252 }
   3253 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane first operand and the two 16-lane
         * byte operands are each lane-reversed before the builtin call; the 4-lane
         * result is lane-reversed again afterwards.
         */
   3254 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) {
   3255   int32x4_t __ret;
   3256   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3257   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3258   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3259   __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
   3260   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3261   return __ret;
   3262 }
        /*
         * __noswap_vusdotq_s32: same builtin call with no lane reversal.
         * NOTE(review): presumably called by other wrappers that reverse their
         * operands themselves; no caller appears in this part of the file.
         */
   3263 __ai __attribute__((target("i8mm,neon"))) int32x4_t __noswap_vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) {
   3264   int32x4_t __ret;
   3265   __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   3266   return __ret;
   3267 }
   3268 #endif
   3269 
   3270 #ifdef __LITTLE_ENDIAN__
        /*
         * vusdot_s32: wraps __builtin_neon_vusdot_s32 for an int32x2_t first
         * operand, a uint8x8_t second operand and an int8x8_t third operand,
         * returning int32x2_t. Declared with target("i8mm,neon"). (Presumably a
         * mixed-sign dot product with accumulate, judging by the name.)
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3271 __ai __attribute__((target("i8mm,neon"))) int32x2_t vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) {
   3272   int32x2_t __ret;
   3273   __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
   3274   return __ret;
   3275 }
   3276 #else
        /*
         * Without __LITTLE_ENDIAN__: the 2-lane first operand and the two 8-lane
         * byte operands are each lane-reversed before the builtin call; the 2-lane
         * result is lane-reversed again afterwards.
         */
   3277 __ai __attribute__((target("i8mm,neon"))) int32x2_t vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) {
   3278   int32x2_t __ret;
   3279   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   3280   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   3281   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   3282   __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2);
   3283   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   3284   return __ret;
   3285 }
        /*
         * __noswap_vusdot_s32: same builtin call with no lane reversal.
         * NOTE(review): presumably called by other wrappers that reverse their
         * operands themselves; no caller appears in this part of the file.
         */
   3286 __ai __attribute__((target("i8mm,neon"))) int32x2_t __noswap_vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) {
   3287   int32x2_t __ret;
   3288   __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
   3289   return __ret;
   3290 }
   3291 #endif
   3292 
   3293 #ifdef __LITTLE_ENDIAN__
        /*
         * vusmmlaq_s32: wraps __builtin_neon_vusmmlaq_s32 for an int32x4_t first
         * operand, a uint8x16_t second operand and an int8x16_t third operand,
         * returning int32x4_t. Declared with target("i8mm,neon"). (Presumably a
         * mixed-sign matrix multiply-accumulate, judging by the name.)
         * With __LITTLE_ENDIAN__ defined the operands are forwarded unchanged.
         */
   3294 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusmmlaq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) {
   3295   int32x4_t __ret;
   3296   __ret = (int32x4_t) __builtin_neon_vusmmlaq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   3297   return __ret;
   3298 }
   3299 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane first operand and the two 16-lane
         * byte operands are each lane-reversed before the builtin call; the 4-lane
         * result is lane-reversed again afterwards.
         */
   3300 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusmmlaq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) {
   3301   int32x4_t __ret;
   3302   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   3303   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3304   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   3305   __ret = (int32x4_t) __builtin_neon_vusmmlaq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
   3306   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   3307   return __ret;
   3308 }
   3309 #endif
   3310 
   3311 #ifdef __LITTLE_ENDIAN__
        /*
         * splat_lane_p8(__p0, __p1): statement-expression macro yielding a
         * poly8x8_t from __builtin_neon_splat_lane_v. __p0 is copied into the
         * local __s0 (cast to int8x8_t for the call); __p1 is pasted directly into
         * the call as the lane argument. (Presumably broadcasts lane __p1 of __p0
         * to every lane, judging by the name.)
         */
   3312 #define splat_lane_p8(__p0, __p1) __extension__ ({ \
   3313   poly8x8_t __ret; \
   3314   poly8x8_t __s0 = __p0; \
   3315   __ret = (poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 4); \
   3316   __ret; \
   3317 })
   3318 #else
        /*
         * Without __LITTLE_ENDIAN__: the 8-lane input is lane-reversed before the
         * builtin call and the 8-lane result is lane-reversed afterwards.
         */
   3319 #define splat_lane_p8(__p0, __p1) __extension__ ({ \
   3320   poly8x8_t __ret; \
   3321   poly8x8_t __s0 = __p0; \
   3322   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   3323   __ret = (poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 4); \
   3324   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   3325   __ret; \
   3326 })
        /* __noswap_splat_lane_p8: same builtin call with no lane reversal. */
   3327 #define __noswap_splat_lane_p8(__p0, __p1) __extension__ ({ \
   3328   poly8x8_t __ret; \
   3329   poly8x8_t __s0 = __p0; \
   3330   __ret = (poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 4); \
   3331   __ret; \
   3332 })
   3333 #endif
   3334 
   3335 #define splat_lane_p64(__p0, __p1) __extension__ ({ /* single definition, not split on __LITTLE_ENDIAN__ */ \
   3336   poly64x1_t __ret; \
   3337   poly64x1_t __s0 = __p0; /* the only expansion of macro argument __p0 */ \
   3338   __ret = (poly64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 6); /* __p1 is pasted in as the lane argument; no shuffle is applied */ \
   3339   __ret; /* value of the statement expression */ \
   3340 })
   3341 #ifdef __LITTLE_ENDIAN__
        /*
         * splat_lane_p16(__p0, __p1): statement-expression macro yielding a
         * poly16x4_t from __builtin_neon_splat_lane_v. __p0 is copied into the
         * local __s0 (cast to int8x8_t for the call); __p1 is pasted directly into
         * the call as the lane argument. (Presumably broadcasts lane __p1 of __p0
         * to every lane, judging by the name.)
         */
   3342 #define splat_lane_p16(__p0, __p1) __extension__ ({ \
   3343   poly16x4_t __ret; \
   3344   poly16x4_t __s0 = __p0; \
   3345   __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 5); \
   3346   __ret; \
   3347 })
   3348 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane input is lane-reversed before the
         * builtin call and the 4-lane result is lane-reversed afterwards.
         */
   3349 #define splat_lane_p16(__p0, __p1) __extension__ ({ \
   3350   poly16x4_t __ret; \
   3351   poly16x4_t __s0 = __p0; \
   3352   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   3353   __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 5); \
   3354   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   3355   __ret; \
   3356 })
        /* __noswap_splat_lane_p16: same builtin call with no lane reversal. */
   3357 #define __noswap_splat_lane_p16(__p0, __p1) __extension__ ({ \
   3358   poly16x4_t __ret; \
   3359   poly16x4_t __s0 = __p0; \
   3360   __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 5); \
   3361   __ret; \
   3362 })
   3363 #endif
   3364 
   3365 #ifdef __LITTLE_ENDIAN__
        /*
         * splatq_lane_p8(__p0, __p1): statement-expression macro yielding a
         * poly8x16_t from __builtin_neon_splatq_lane_v, given a poly8x8_t input.
         * __p0 is copied into the local __s0 (cast to int8x8_t for the call);
         * __p1 is pasted directly into the call as the lane argument.
         */
   3366 #define splatq_lane_p8(__p0, __p1) __extension__ ({ \
   3367   poly8x16_t __ret; \
   3368   poly8x8_t __s0 = __p0; \
   3369   __ret = (poly8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 4); \
   3370   __ret; \
   3371 })
   3372 #else
        /*
         * Without __LITTLE_ENDIAN__: the 8-lane input is lane-reversed before the
         * builtin call and the 16-lane result is lane-reversed afterwards.
         */
   3373 #define splatq_lane_p8(__p0, __p1) __extension__ ({ \
   3374   poly8x16_t __ret; \
   3375   poly8x8_t __s0 = __p0; \
   3376   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   3377   __ret = (poly8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 4); \
   3378   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   3379   __ret; \
   3380 })
        /* __noswap_splatq_lane_p8: same builtin call with no lane reversal. */
   3381 #define __noswap_splatq_lane_p8(__p0, __p1) __extension__ ({ \
   3382   poly8x16_t __ret; \
   3383   poly8x8_t __s0 = __p0; \
   3384   __ret = (poly8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 4); \
   3385   __ret; \
   3386 })
   3387 #endif
   3388 
   3389 #ifdef __LITTLE_ENDIAN__
        /*
         * splatq_lane_p64(__p0, __p1): statement-expression macro yielding a
         * poly64x2_t from __builtin_neon_splatq_lane_v, given a poly64x1_t input.
         * __p0 is copied into the local __s0 (cast to int8x8_t for the call);
         * __p1 is pasted directly into the call as the lane argument.
         */
   3390 #define splatq_lane_p64(__p0, __p1) __extension__ ({ \
   3391   poly64x2_t __ret; \
   3392   poly64x1_t __s0 = __p0; \
   3393   __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \
   3394   __ret; \
   3395 })
   3396 #else
        /*
         * Without __LITTLE_ENDIAN__: the poly64x1_t input is passed without any
         * shuffle; only the 2-lane result is lane-reversed after the builtin call.
         */
   3397 #define splatq_lane_p64(__p0, __p1) __extension__ ({ \
   3398   poly64x2_t __ret; \
   3399   poly64x1_t __s0 = __p0; \
   3400   __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \
   3401   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   3402   __ret; \
   3403 })
        /* __noswap_splatq_lane_p64: same builtin call with no lane reversal. */
   3404 #define __noswap_splatq_lane_p64(__p0, __p1) __extension__ ({ \
   3405   poly64x2_t __ret; \
   3406   poly64x1_t __s0 = __p0; \
   3407   __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \
   3408   __ret; \
   3409 })
   3410 #endif
   3411 
   3412 #ifdef __LITTLE_ENDIAN__
        /*
         * splatq_lane_p16(__p0, __p1): statement-expression macro yielding a
         * poly16x8_t from __builtin_neon_splatq_lane_v, given a poly16x4_t input.
         * __p0 is copied into the local __s0 (cast to int8x8_t for the call);
         * __p1 is pasted directly into the call as the lane argument.
         */
   3413 #define splatq_lane_p16(__p0, __p1) __extension__ ({ \
   3414   poly16x8_t __ret; \
   3415   poly16x4_t __s0 = __p0; \
   3416   __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 5); \
   3417   __ret; \
   3418 })
   3419 #else
        /*
         * Without __LITTLE_ENDIAN__: the 4-lane input is lane-reversed before the
         * builtin call and the 8-lane result is lane-reversed afterwards.
         */
   3420 #define splatq_lane_p16(__p0, __p1) __extension__ ({ \
   3421   poly16x8_t __ret; \
   3422   poly16x4_t __s0 = __p0; \
   3423   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   3424   __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 5); \
   3425   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   3426   __ret; \
   3427 })
        /* __noswap_splatq_lane_p16: same builtin call with no lane reversal. */
   3428 #define __noswap_splatq_lane_p16(__p0, __p1) __extension__ ({ \
   3429   poly16x8_t __ret; \
   3430   poly16x4_t __s0 = __p0; \
   3431   __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 5); \
   3432   __ret; \
   3433 })
   3434 #endif
   3435 
   /* splatq_lane_u8: uint8x8_t source, uint8x16_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 16.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_u8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 16); \
     __ret; \
   })
   #else
   #define splatq_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 16); \
     __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 16); \
     __ret; \
   })
   #endif
   3459 
   /* splatq_lane_u32: uint32x2_t source, uint32x4_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 18.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_u32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 18); \
     __ret; \
   })
   #else
   #define splatq_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 18); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 18); \
     __ret; \
   })
   #endif
   3483 
   /* splatq_lane_u64: uint64x1_t source, uint64x2_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 19.  Without
    * __LITTLE_ENDIAN__ the result lanes are reversed after the call;
    * __noswap_splatq_lane_u64 is the same call without that reversal. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_u64(__p0, __p1) __extension__ ({ \
     uint64x1_t __s0 = __p0; \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \
     __ret; \
   })
   #else
   #define splatq_lane_u64(__p0, __p1) __extension__ ({ \
     uint64x1_t __s0 = __p0; \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_u64(__p0, __p1) __extension__ ({ \
     uint64x1_t __s0 = __p0; \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \
     __ret; \
   })
   #endif
   3506 
   /* splatq_lane_u16: uint16x4_t source, uint16x8_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 17.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_u16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 17); \
     __ret; \
   })
   #else
   #define splatq_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 17); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 17); \
     __ret; \
   })
   #endif
   3530 
   /* splatq_lane_s8: int8x8_t source, int8x16_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 0.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_s8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 0); \
     __ret; \
   })
   #else
   #define splatq_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 0); \
     __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 0); \
     __ret; \
   })
   #endif
   3554 
   /* splatq_lane_f64: float64x1_t source, float64x2_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 10.  Without
    * __LITTLE_ENDIAN__ the result lanes are reversed after the call;
    * __noswap_splatq_lane_f64 is the same call without that reversal. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_f64(__p0, __p1) __extension__ ({ \
     float64x1_t __s0 = __p0; \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \
     __ret; \
   })
   #else
   #define splatq_lane_f64(__p0, __p1) __extension__ ({ \
     float64x1_t __s0 = __p0; \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_f64(__p0, __p1) __extension__ ({ \
     float64x1_t __s0 = __p0; \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \
     __ret; \
   })
   #endif
   3577 
   /* splatq_lane_f32: float32x2_t source, float32x4_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 9.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_f32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x4_t __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 9); \
     __ret; \
   })
   #else
   #define splatq_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     float32x4_t __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 9); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x4_t __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 9); \
     __ret; \
   })
   #endif
   3601 
   /* splatq_lane_f16: float16x4_t source, float16x8_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 8.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_f16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x8_t __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 8); \
     __ret; \
   })
   #else
   #define splatq_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     float16x8_t __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 8); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x8_t __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 8); \
     __ret; \
   })
   #endif
   3625 
   /* splatq_lane_s32: int32x2_t source, int32x4_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 2.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_s32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x4_t __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 2); \
     __ret; \
   })
   #else
   #define splatq_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     int32x4_t __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 2); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x4_t __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 2); \
     __ret; \
   })
   #endif
   3649 
   /* splatq_lane_s64: int64x1_t source, int64x2_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 3.  Without
    * __LITTLE_ENDIAN__ the result lanes are reversed after the call;
    * __noswap_splatq_lane_s64 is the same call without that reversal. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_s64(__p0, __p1) __extension__ ({ \
     int64x1_t __s0 = __p0; \
     int64x2_t __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \
     __ret; \
   })
   #else
   #define splatq_lane_s64(__p0, __p1) __extension__ ({ \
     int64x1_t __s0 = __p0; \
     int64x2_t __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_s64(__p0, __p1) __extension__ ({ \
     int64x1_t __s0 = __p0; \
     int64x2_t __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \
     __ret; \
   })
   #endif
   3672 
   /* splatq_lane_s16: int16x4_t source, int16x8_t result, produced by
    * __builtin_neon_splatq_lane_v with selector constant 1.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_lane_s16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x8_t __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 1); \
     __ret; \
   })
   #else
   #define splatq_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     int16x8_t __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 1); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x8_t __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 1); \
     __ret; \
   })
   #endif
   3696 
   /* splat_lane_u8: uint8x8_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 16.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_u8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x8_t __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 16); \
     __ret; \
   })
   #else
   #define splat_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     uint8x8_t __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 16); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_u8(__p0, __p1) __extension__ ({ \
     uint8x8_t __s0 = __p0; \
     uint8x8_t __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 16); \
     __ret; \
   })
   #endif
   3720 
   /* splat_lane_u32: uint32x2_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 18.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_u32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x2_t __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 18); \
     __ret; \
   })
   #else
   #define splat_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     uint32x2_t __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 18); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_u32(__p0, __p1) __extension__ ({ \
     uint32x2_t __s0 = __p0; \
     uint32x2_t __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 18); \
     __ret; \
   })
   #endif
   3744 
   /* splat_lane_u64: uint64x1_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 19.  Defined once,
    * outside the adjacent __LITTLE_ENDIAN__ guards, with no lane reversal. */
   #define splat_lane_u64(__p0, __p1) __extension__ ({ \
     uint64x1_t __s0 = __p0; \
     uint64x1_t __ret = (uint64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 19); \
     __ret; \
   })
   /* splat_lane_u16: uint16x4_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 17.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_u16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x4_t __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 17); \
     __ret; \
   })
   #else
   #define splat_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     uint16x4_t __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 17); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_u16(__p0, __p1) __extension__ ({ \
     uint16x4_t __s0 = __p0; \
     uint16x4_t __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 17); \
     __ret; \
   })
   #endif
   3774 
   /* splat_lane_s8: int8x8_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 0.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_s8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x8_t __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 0); \
     __ret; \
   })
   #else
   #define splat_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     int8x8_t __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 0); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_s8(__p0, __p1) __extension__ ({ \
     int8x8_t __s0 = __p0; \
     int8x8_t __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 0); \
     __ret; \
   })
   #endif
   3798 
   /* splat_lane_f64: float64x1_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 10.  Defined once,
    * outside the adjacent __LITTLE_ENDIAN__ guards, with no lane reversal. */
   #define splat_lane_f64(__p0, __p1) __extension__ ({ \
     float64x1_t __s0 = __p0; \
     float64x1_t __ret = (float64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 10); \
     __ret; \
   })
   /* splat_lane_f32: float32x2_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 9.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_f32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x2_t __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 9); \
     __ret; \
   })
   #else
   #define splat_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     float32x2_t __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 9); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_f32(__p0, __p1) __extension__ ({ \
     float32x2_t __s0 = __p0; \
     float32x2_t __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 9); \
     __ret; \
   })
   #endif
   3828 
   /* splat_lane_f16: float16x4_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 8.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_f16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x4_t __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 8); \
     __ret; \
   })
   #else
   #define splat_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     float16x4_t __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 8); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_f16(__p0, __p1) __extension__ ({ \
     float16x4_t __s0 = __p0; \
     float16x4_t __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 8); \
     __ret; \
   })
   #endif
   3852 
   /* splat_lane_s32: int32x2_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 2.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_s32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x2_t __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 2); \
     __ret; \
   })
   #else
   #define splat_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     int32x2_t __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 2); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_s32(__p0, __p1) __extension__ ({ \
     int32x2_t __s0 = __p0; \
     int32x2_t __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 2); \
     __ret; \
   })
   #endif
   3876 
   /* splat_lane_s64: int64x1_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 3.  Defined once,
    * outside the adjacent __LITTLE_ENDIAN__ guards, with no lane reversal. */
   #define splat_lane_s64(__p0, __p1) __extension__ ({ \
     int64x1_t __s0 = __p0; \
     int64x1_t __ret = (int64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 3); \
     __ret; \
   })
   /* splat_lane_s16: int16x4_t source and result, produced by
    * __builtin_neon_splat_lane_v with selector constant 1.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_lane_s16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x4_t __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 1); \
     __ret; \
   })
   #else
   #define splat_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     int16x4_t __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 1); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_lane_s16(__p0, __p1) __extension__ ({ \
     int16x4_t __s0 = __p0; \
     int16x4_t __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 1); \
     __ret; \
   })
   #endif
   3906 
   /* splat_laneq_p8: poly8x16_t source, poly8x8_t result, produced by
    * __builtin_neon_splat_laneq_v with selector constant 36.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_laneq_p8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x8_t __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 36); \
     __ret; \
   })
   #else
   #define splat_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x16_t __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     poly8x8_t __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 36); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x8_t __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 36); \
     __ret; \
   })
   #endif
   3930 
   /* splat_laneq_p64: poly64x2_t source, poly64x1_t result, produced by
    * __builtin_neon_splat_laneq_v with selector constant 38.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call (the
    * result is not reshuffled); __noswap_splat_laneq_p64 omits the reversal. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x1_t __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 38); \
     __ret; \
   })
   #else
   #define splat_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     poly64x1_t __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 38); \
     __ret; \
   })
   #define __noswap_splat_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x1_t __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 38); \
     __ret; \
   })
   #endif
   3953 
   /* splat_laneq_p16: poly16x8_t source, poly16x4_t result, produced by
    * __builtin_neon_splat_laneq_v with selector constant 37.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splat_laneq_p16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splat_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x4_t __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 37); \
     __ret; \
   })
   #else
   #define splat_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     poly16x4_t __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 37); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splat_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x4_t __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 37); \
     __ret; \
   })
   #endif
   3977 
   /* splatq_laneq_p8: poly8x16_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 36.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_p8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x16_t __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 36); \
     __ret; \
   })
   #else
   #define splatq_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x16_t __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     poly8x16_t __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 36); \
     __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_p8(__p0, __p1) __extension__ ({ \
     poly8x16_t __s0 = __p0; \
     poly8x16_t __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 36); \
     __ret; \
   })
   #endif
   4001 
   /* splatq_laneq_p64: poly64x2_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 38.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_p64 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x2_t __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 38); \
     __ret; \
   })
   #else
   #define splatq_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     poly64x2_t __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 38); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_p64(__p0, __p1) __extension__ ({ \
     poly64x2_t __s0 = __p0; \
     poly64x2_t __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 38); \
     __ret; \
   })
   #endif
   4025 
   /* splatq_laneq_p16: poly16x8_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 37.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_p16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x8_t __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 37); \
     __ret; \
   })
   #else
   #define splatq_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     poly16x8_t __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 37); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_p16(__p0, __p1) __extension__ ({ \
     poly16x8_t __s0 = __p0; \
     poly16x8_t __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 37); \
     __ret; \
   })
   #endif
   4049 
   /* splatq_laneq_u8: uint8x16_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 48.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_u8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_u8(__p0, __p1) __extension__ ({ \
     uint8x16_t __s0 = __p0; \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 48); \
     __ret; \
   })
   #else
   #define splatq_laneq_u8(__p0, __p1) __extension__ ({ \
     uint8x16_t __s0 = __p0; \
     uint8x16_t __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 48); \
     __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_u8(__p0, __p1) __extension__ ({ \
     uint8x16_t __s0 = __p0; \
     uint8x16_t __ret = (uint8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 48); \
     __ret; \
   })
   #endif
   4073 
   /* splatq_laneq_u32: uint32x4_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 50.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_u32 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_u32(__p0, __p1) __extension__ ({ \
     uint32x4_t __s0 = __p0; \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 50); \
     __ret; \
   })
   #else
   #define splatq_laneq_u32(__p0, __p1) __extension__ ({ \
     uint32x4_t __s0 = __p0; \
     uint32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 50); \
     __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_u32(__p0, __p1) __extension__ ({ \
     uint32x4_t __s0 = __p0; \
     uint32x4_t __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 50); \
     __ret; \
   })
   #endif
   4097 
   /* splatq_laneq_u64: uint64x2_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 51.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_u64 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_u64(__p0, __p1) __extension__ ({ \
     uint64x2_t __s0 = __p0; \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 51); \
     __ret; \
   })
   #else
   #define splatq_laneq_u64(__p0, __p1) __extension__ ({ \
     uint64x2_t __s0 = __p0; \
     uint64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 51); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_u64(__p0, __p1) __extension__ ({ \
     uint64x2_t __s0 = __p0; \
     uint64x2_t __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 51); \
     __ret; \
   })
   #endif
   4121 
   /* splatq_laneq_u16: uint16x8_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 49.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_u16 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_u16(__p0, __p1) __extension__ ({ \
     uint16x8_t __s0 = __p0; \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 49); \
     __ret; \
   })
   #else
   #define splatq_laneq_u16(__p0, __p1) __extension__ ({ \
     uint16x8_t __s0 = __p0; \
     uint16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 49); \
     __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_u16(__p0, __p1) __extension__ ({ \
     uint16x8_t __s0 = __p0; \
     uint16x8_t __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 49); \
     __ret; \
   })
   #endif
   4145 
   /* splatq_laneq_s8: int8x16_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 32.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_s8 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_s8(__p0, __p1) __extension__ ({ \
     int8x16_t __s0 = __p0; \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 32); \
     __ret; \
   })
   #else
   #define splatq_laneq_s8(__p0, __p1) __extension__ ({ \
     int8x16_t __s0 = __p0; \
     int8x16_t __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 32); \
     __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_s8(__p0, __p1) __extension__ ({ \
     int8x16_t __s0 = __p0; \
     int8x16_t __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 32); \
     __ret; \
   })
   #endif
   4169 
   /* splatq_laneq_f64: float64x2_t source and result, produced by
    * __builtin_neon_splatq_laneq_v with selector constant 42.  Without
    * __LITTLE_ENDIAN__ the source lanes are reversed before the call and the
    * result lanes after it; __noswap_splatq_laneq_f64 omits both reversals. */
   #ifdef __LITTLE_ENDIAN__
   #define splatq_laneq_f64(__p0, __p1) __extension__ ({ \
     float64x2_t __s0 = __p0; \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 42); \
     __ret; \
   })
   #else
   #define splatq_laneq_f64(__p0, __p1) __extension__ ({ \
     float64x2_t __s0 = __p0; \
     float64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 42); \
     __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
     __ret; \
   })
   #define __noswap_splatq_laneq_f64(__p0, __p1) __extension__ ({ \
     float64x2_t __s0 = __p0; \
     float64x2_t __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 42); \
     __ret; \
   })
   #endif
   4193 
   4194 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_f32 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a float32x4_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 41 to __builtin_neon_splatq_laneq_v, and
         * evaluates to the result cast to float32x4_t. The constant is presumably
         * the builtin's type selector -- confirm against the builtin definition. */
   4195 #define splatq_laneq_f32(__p0, __p1) __extension__ ({ \
   4196   float32x4_t __ret; \
   4197   float32x4_t __s0 = __p0; \
   4198   __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 41); \
   4199   __ret; \
   4200 })
   4201 #else
        /* splatq_laneq_f32 when __LITTLE_ENDIAN__ is not defined: reverses the 4
         * input lanes before the builtin call and the 4 result lanes afterwards. */
   4202 #define splatq_laneq_f32(__p0, __p1) __extension__ ({ \
   4203   float32x4_t __ret; \
   4204   float32x4_t __s0 = __p0; \
   4205   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   4206   __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 41); \
   4207   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   4208   __ret; \
   4209 })
        /* __noswap_splatq_laneq_f32: same builtin call with no lane reversal of the
         * input or the result. */
   4210 #define __noswap_splatq_laneq_f32(__p0, __p1) __extension__ ({ \
   4211   float32x4_t __ret; \
   4212   float32x4_t __s0 = __p0; \
   4213   __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 41); \
   4214   __ret; \
   4215 })
   4216 #endif
   4217 
   4218 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_f16 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a float16x8_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 40 to __builtin_neon_splatq_laneq_v, and
         * evaluates to the result cast to float16x8_t. The constant is presumably
         * the builtin's type selector -- confirm against the builtin definition. */
   4219 #define splatq_laneq_f16(__p0, __p1) __extension__ ({ \
   4220   float16x8_t __ret; \
   4221   float16x8_t __s0 = __p0; \
   4222   __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 40); \
   4223   __ret; \
   4224 })
   4225 #else
        /* splatq_laneq_f16 when __LITTLE_ENDIAN__ is not defined: reverses the 8
         * input lanes before the builtin call and the 8 result lanes afterwards. */
   4226 #define splatq_laneq_f16(__p0, __p1) __extension__ ({ \
   4227   float16x8_t __ret; \
   4228   float16x8_t __s0 = __p0; \
   4229   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   4230   __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 40); \
   4231   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   4232   __ret; \
   4233 })
        /* __noswap_splatq_laneq_f16: same builtin call with no lane reversal of the
         * input or the result. */
   4234 #define __noswap_splatq_laneq_f16(__p0, __p1) __extension__ ({ \
   4235   float16x8_t __ret; \
   4236   float16x8_t __s0 = __p0; \
   4237   __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 40); \
   4238   __ret; \
   4239 })
   4240 #endif
   4241 
   4242 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_s32 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int32x4_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 34 to __builtin_neon_splatq_laneq_v, and
         * evaluates to the result cast to int32x4_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4243 #define splatq_laneq_s32(__p0, __p1) __extension__ ({ \
   4244   int32x4_t __ret; \
   4245   int32x4_t __s0 = __p0; \
   4246   __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 34); \
   4247   __ret; \
   4248 })
   4249 #else
        /* splatq_laneq_s32 when __LITTLE_ENDIAN__ is not defined: reverses the 4
         * input lanes before the builtin call and the 4 result lanes afterwards. */
   4250 #define splatq_laneq_s32(__p0, __p1) __extension__ ({ \
   4251   int32x4_t __ret; \
   4252   int32x4_t __s0 = __p0; \
   4253   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   4254   __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 34); \
   4255   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   4256   __ret; \
   4257 })
        /* __noswap_splatq_laneq_s32: same builtin call with no lane reversal of the
         * input or the result. */
   4258 #define __noswap_splatq_laneq_s32(__p0, __p1) __extension__ ({ \
   4259   int32x4_t __ret; \
   4260   int32x4_t __s0 = __p0; \
   4261   __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 34); \
   4262   __ret; \
   4263 })
   4264 #endif
   4265 
   4266 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_s64 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int64x2_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 35 to __builtin_neon_splatq_laneq_v, and
         * evaluates to the result cast to int64x2_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4267 #define splatq_laneq_s64(__p0, __p1) __extension__ ({ \
   4268   int64x2_t __ret; \
   4269   int64x2_t __s0 = __p0; \
   4270   __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 35); \
   4271   __ret; \
   4272 })
   4273 #else
        /* splatq_laneq_s64 when __LITTLE_ENDIAN__ is not defined: swaps the 2 input
         * lanes before the builtin call and the 2 result lanes afterwards. */
   4274 #define splatq_laneq_s64(__p0, __p1) __extension__ ({ \
   4275   int64x2_t __ret; \
   4276   int64x2_t __s0 = __p0; \
   4277   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   4278   __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 35); \
   4279   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   4280   __ret; \
   4281 })
        /* __noswap_splatq_laneq_s64: same builtin call with no lane reversal of the
         * input or the result. */
   4282 #define __noswap_splatq_laneq_s64(__p0, __p1) __extension__ ({ \
   4283   int64x2_t __ret; \
   4284   int64x2_t __s0 = __p0; \
   4285   __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 35); \
   4286   __ret; \
   4287 })
   4288 #endif
   4289 
   4290 #ifdef __LITTLE_ENDIAN__
        /* splatq_laneq_s16 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int16x8_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 33 to __builtin_neon_splatq_laneq_v, and
         * evaluates to the result cast to int16x8_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4291 #define splatq_laneq_s16(__p0, __p1) __extension__ ({ \
   4292   int16x8_t __ret; \
   4293   int16x8_t __s0 = __p0; \
   4294   __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 33); \
   4295   __ret; \
   4296 })
   4297 #else
        /* splatq_laneq_s16 when __LITTLE_ENDIAN__ is not defined: reverses the 8
         * input lanes before the builtin call and the 8 result lanes afterwards. */
   4298 #define splatq_laneq_s16(__p0, __p1) __extension__ ({ \
   4299   int16x8_t __ret; \
   4300   int16x8_t __s0 = __p0; \
   4301   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   4302   __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 33); \
   4303   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   4304   __ret; \
   4305 })
        /* __noswap_splatq_laneq_s16: same builtin call with no lane reversal of the
         * input or the result. */
   4306 #define __noswap_splatq_laneq_s16(__p0, __p1) __extension__ ({ \
   4307   int16x8_t __ret; \
   4308   int16x8_t __s0 = __p0; \
   4309   __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 33); \
   4310   __ret; \
   4311 })
   4312 #endif
   4313 
   4314 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_u8 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a uint8x16_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 48 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to uint8x8_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4315 #define splat_laneq_u8(__p0, __p1) __extension__ ({ \
   4316   uint8x8_t __ret; \
   4317   uint8x16_t __s0 = __p0; \
   4318   __ret = (uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 48); \
   4319   __ret; \
   4320 })
   4321 #else
        /* splat_laneq_u8 when __LITTLE_ENDIAN__ is not defined: reverses the 16
         * input lanes before the builtin call and the 8 result lanes afterwards. */
   4322 #define splat_laneq_u8(__p0, __p1) __extension__ ({ \
   4323   uint8x8_t __ret; \
   4324   uint8x16_t __s0 = __p0; \
   4325   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   4326   __ret = (uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 48); \
   4327   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   4328   __ret; \
   4329 })
        /* __noswap_splat_laneq_u8: same builtin call with no lane reversal of the
         * input or the result. */
   4330 #define __noswap_splat_laneq_u8(__p0, __p1) __extension__ ({ \
   4331   uint8x8_t __ret; \
   4332   uint8x16_t __s0 = __p0; \
   4333   __ret = (uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 48); \
   4334   __ret; \
   4335 })
   4336 #endif
   4337 
   4338 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_u32 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a uint32x4_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 50 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to uint32x2_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4339 #define splat_laneq_u32(__p0, __p1) __extension__ ({ \
   4340   uint32x2_t __ret; \
   4341   uint32x4_t __s0 = __p0; \
   4342   __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 50); \
   4343   __ret; \
   4344 })
   4345 #else
        /* splat_laneq_u32 when __LITTLE_ENDIAN__ is not defined: reverses the 4
         * input lanes before the builtin call and the 2 result lanes afterwards. */
   4346 #define splat_laneq_u32(__p0, __p1) __extension__ ({ \
   4347   uint32x2_t __ret; \
   4348   uint32x4_t __s0 = __p0; \
   4349   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   4350   __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 50); \
   4351   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   4352   __ret; \
   4353 })
        /* __noswap_splat_laneq_u32: same builtin call with no lane reversal of the
         * input or the result. */
   4354 #define __noswap_splat_laneq_u32(__p0, __p1) __extension__ ({ \
   4355   uint32x2_t __ret; \
   4356   uint32x4_t __s0 = __p0; \
   4357   __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 50); \
   4358   __ret; \
   4359 })
   4360 #endif
   4361 
   4362 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_u64 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a uint64x2_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 51 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to uint64x1_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4363 #define splat_laneq_u64(__p0, __p1) __extension__ ({ \
   4364   uint64x1_t __ret; \
   4365   uint64x2_t __s0 = __p0; \
   4366   __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 51); \
   4367   __ret; \
   4368 })
   4369 #else
        /* splat_laneq_u64 when __LITTLE_ENDIAN__ is not defined: swaps the 2 input
         * lanes before the builtin call. The uint64x1_t result is not shuffled. */
   4370 #define splat_laneq_u64(__p0, __p1) __extension__ ({ \
   4371   uint64x1_t __ret; \
   4372   uint64x2_t __s0 = __p0; \
   4373   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   4374   __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 51); \
   4375   __ret; \
   4376 })
        /* __noswap_splat_laneq_u64: same builtin call with no lane reversal of the
         * input. */
   4377 #define __noswap_splat_laneq_u64(__p0, __p1) __extension__ ({ \
   4378   uint64x1_t __ret; \
   4379   uint64x2_t __s0 = __p0; \
   4380   __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 51); \
   4381   __ret; \
   4382 })
   4383 #endif
   4384 
   4385 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_u16 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a uint16x8_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 49 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to uint16x4_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4386 #define splat_laneq_u16(__p0, __p1) __extension__ ({ \
   4387   uint16x4_t __ret; \
   4388   uint16x8_t __s0 = __p0; \
   4389   __ret = (uint16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 49); \
   4390   __ret; \
   4391 })
   4392 #else
        /* splat_laneq_u16 when __LITTLE_ENDIAN__ is not defined: reverses the 8
         * input lanes before the builtin call and the 4 result lanes afterwards. */
   4393 #define splat_laneq_u16(__p0, __p1) __extension__ ({ \
   4394   uint16x4_t __ret; \
   4395   uint16x8_t __s0 = __p0; \
   4396   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   4397   __ret = (uint16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 49); \
   4398   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   4399   __ret; \
   4400 })
        /* __noswap_splat_laneq_u16: same builtin call with no lane reversal of the
         * input or the result. */
   4401 #define __noswap_splat_laneq_u16(__p0, __p1) __extension__ ({ \
   4402   uint16x4_t __ret; \
   4403   uint16x8_t __s0 = __p0; \
   4404   __ret = (uint16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 49); \
   4405   __ret; \
   4406 })
   4407 #endif
   4408 
   4409 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_s8 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int8x16_t local, passes it with __p1 and the
         * constant 32 to __builtin_neon_splat_laneq_v, and evaluates to the result
         * cast to int8x8_t. The constant is presumably the builtin's type selector
         * -- confirm against the builtin definition. */
   4410 #define splat_laneq_s8(__p0, __p1) __extension__ ({ \
   4411   int8x8_t __ret; \
   4412   int8x16_t __s0 = __p0; \
   4413   __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 32); \
   4414   __ret; \
   4415 })
   4416 #else
        /* splat_laneq_s8 when __LITTLE_ENDIAN__ is not defined: reverses the 16
         * input lanes before the builtin call and the 8 result lanes afterwards. */
   4417 #define splat_laneq_s8(__p0, __p1) __extension__ ({ \
   4418   int8x8_t __ret; \
   4419   int8x16_t __s0 = __p0; \
   4420   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   4421   __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 32); \
   4422   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   4423   __ret; \
   4424 })
        /* __noswap_splat_laneq_s8: same builtin call with no lane reversal of the
         * input or the result. */
   4425 #define __noswap_splat_laneq_s8(__p0, __p1) __extension__ ({ \
   4426   int8x8_t __ret; \
   4427   int8x16_t __s0 = __p0; \
   4428   __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 32); \
   4429   __ret; \
   4430 })
   4431 #endif
   4432 
   4433 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_f64 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a float64x2_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 42 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to float64x1_t. The constant is presumably
         * the builtin's type selector -- confirm against the builtin definition. */
   4434 #define splat_laneq_f64(__p0, __p1) __extension__ ({ \
   4435   float64x1_t __ret; \
   4436   float64x2_t __s0 = __p0; \
   4437   __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 42); \
   4438   __ret; \
   4439 })
   4440 #else
        /* splat_laneq_f64 when __LITTLE_ENDIAN__ is not defined: swaps the 2 input
         * lanes before the builtin call. The float64x1_t result is not shuffled. */
   4441 #define splat_laneq_f64(__p0, __p1) __extension__ ({ \
   4442   float64x1_t __ret; \
   4443   float64x2_t __s0 = __p0; \
   4444   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   4445   __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 42); \
   4446   __ret; \
   4447 })
        /* __noswap_splat_laneq_f64: same builtin call with no lane reversal of the
         * input. */
   4448 #define __noswap_splat_laneq_f64(__p0, __p1) __extension__ ({ \
   4449   float64x1_t __ret; \
   4450   float64x2_t __s0 = __p0; \
   4451   __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 42); \
   4452   __ret; \
   4453 })
   4454 #endif
   4455 
   4456 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_f32 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a float32x4_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 41 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to float32x2_t. The constant is presumably
         * the builtin's type selector -- confirm against the builtin definition. */
   4457 #define splat_laneq_f32(__p0, __p1) __extension__ ({ \
   4458   float32x2_t __ret; \
   4459   float32x4_t __s0 = __p0; \
   4460   __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 41); \
   4461   __ret; \
   4462 })
   4463 #else
        /* splat_laneq_f32 when __LITTLE_ENDIAN__ is not defined: reverses the 4
         * input lanes before the builtin call and the 2 result lanes afterwards. */
   4464 #define splat_laneq_f32(__p0, __p1) __extension__ ({ \
   4465   float32x2_t __ret; \
   4466   float32x4_t __s0 = __p0; \
   4467   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   4468   __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 41); \
   4469   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   4470   __ret; \
   4471 })
        /* __noswap_splat_laneq_f32: same builtin call with no lane reversal of the
         * input or the result. */
   4472 #define __noswap_splat_laneq_f32(__p0, __p1) __extension__ ({ \
   4473   float32x2_t __ret; \
   4474   float32x4_t __s0 = __p0; \
   4475   __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 41); \
   4476   __ret; \
   4477 })
   4478 #endif
   4479 
   4480 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_f16 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into a float16x8_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 40 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to float16x4_t. The constant is presumably
         * the builtin's type selector -- confirm against the builtin definition. */
   4481 #define splat_laneq_f16(__p0, __p1) __extension__ ({ \
   4482   float16x4_t __ret; \
   4483   float16x8_t __s0 = __p0; \
   4484   __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 40); \
   4485   __ret; \
   4486 })
   4487 #else
        /* splat_laneq_f16 when __LITTLE_ENDIAN__ is not defined: reverses the 8
         * input lanes before the builtin call and the 4 result lanes afterwards. */
   4488 #define splat_laneq_f16(__p0, __p1) __extension__ ({ \
   4489   float16x4_t __ret; \
   4490   float16x8_t __s0 = __p0; \
   4491   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   4492   __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 40); \
   4493   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   4494   __ret; \
   4495 })
        /* __noswap_splat_laneq_f16: same builtin call with no lane reversal of the
         * input or the result. */
   4496 #define __noswap_splat_laneq_f16(__p0, __p1) __extension__ ({ \
   4497   float16x4_t __ret; \
   4498   float16x8_t __s0 = __p0; \
   4499   __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 40); \
   4500   __ret; \
   4501 })
   4502 #endif
   4503 
   4504 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_s32 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int32x4_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 34 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to int32x2_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4505 #define splat_laneq_s32(__p0, __p1) __extension__ ({ \
   4506   int32x2_t __ret; \
   4507   int32x4_t __s0 = __p0; \
   4508   __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 34); \
   4509   __ret; \
   4510 })
   4511 #else
        /* splat_laneq_s32 when __LITTLE_ENDIAN__ is not defined: reverses the 4
         * input lanes before the builtin call and the 2 result lanes afterwards. */
   4512 #define splat_laneq_s32(__p0, __p1) __extension__ ({ \
   4513   int32x2_t __ret; \
   4514   int32x4_t __s0 = __p0; \
   4515   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   4516   __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 34); \
   4517   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   4518   __ret; \
   4519 })
        /* __noswap_splat_laneq_s32: same builtin call with no lane reversal of the
         * input or the result. */
   4520 #define __noswap_splat_laneq_s32(__p0, __p1) __extension__ ({ \
   4521   int32x2_t __ret; \
   4522   int32x4_t __s0 = __p0; \
   4523   __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 34); \
   4524   __ret; \
   4525 })
   4526 #endif
   4527 
   4528 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_s64 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int64x2_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 35 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to int64x1_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4529 #define splat_laneq_s64(__p0, __p1) __extension__ ({ \
   4530   int64x1_t __ret; \
   4531   int64x2_t __s0 = __p0; \
   4532   __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 35); \
   4533   __ret; \
   4534 })
   4535 #else
        /* splat_laneq_s64 when __LITTLE_ENDIAN__ is not defined: swaps the 2 input
         * lanes before the builtin call. The int64x1_t result is not shuffled. */
   4536 #define splat_laneq_s64(__p0, __p1) __extension__ ({ \
   4537   int64x1_t __ret; \
   4538   int64x2_t __s0 = __p0; \
   4539   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   4540   __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 35); \
   4541   __ret; \
   4542 })
        /* __noswap_splat_laneq_s64: same builtin call with no lane reversal of the
         * input. */
   4543 #define __noswap_splat_laneq_s64(__p0, __p1) __extension__ ({ \
   4544   int64x1_t __ret; \
   4545   int64x2_t __s0 = __p0; \
   4546   __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 35); \
   4547   __ret; \
   4548 })
   4549 #endif
   4550 
   4551 #ifdef __LITTLE_ENDIAN__
        /* splat_laneq_s16 when __LITTLE_ENDIAN__ is defined. Statement-expression
         * macro: copies __p0 into an int16x8_t local, passes it (cast to int8x16_t)
         * with __p1 and the constant 33 to __builtin_neon_splat_laneq_v, and
         * evaluates to the result cast to int16x4_t. The constant is presumably the
         * builtin's type selector -- confirm against the builtin definition. */
   4552 #define splat_laneq_s16(__p0, __p1) __extension__ ({ \
   4553   int16x4_t __ret; \
   4554   int16x8_t __s0 = __p0; \
   4555   __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 33); \
   4556   __ret; \
   4557 })
   4558 #else
        /* splat_laneq_s16 when __LITTLE_ENDIAN__ is not defined: reverses the 8
         * input lanes before the builtin call and the 4 result lanes afterwards. */
   4559 #define splat_laneq_s16(__p0, __p1) __extension__ ({ \
   4560   int16x4_t __ret; \
   4561   int16x8_t __s0 = __p0; \
   4562   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   4563   __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 33); \
   4564   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   4565   __ret; \
   4566 })
        /* __noswap_splat_laneq_s16: same builtin call with no lane reversal of the
         * input or the result. */
   4567 #define __noswap_splat_laneq_s16(__p0, __p1) __extension__ ({ \
   4568   int16x4_t __ret; \
   4569   int16x8_t __s0 = __p0; \
   4570   __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 33); \
   4571   __ret; \
   4572 })
   4573 #endif
   4574 
   4575 #ifdef __LITTLE_ENDIAN__
        /* vabdq_u8 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 48 and returns the
         * result cast to uint8x16_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4576 __ai __attribute__((target("neon"))) uint8x16_t vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   4577   uint8x16_t __ret;
   4578   __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
   4579   return __ret;
   4580 }
   4581 #else
        /* vabdq_u8 when __LITTLE_ENDIAN__ is not defined: reverses the 16 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4582 __ai __attribute__((target("neon"))) uint8x16_t vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   4583   uint8x16_t __ret;
   4584   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4585   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4586   __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
   4587   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4588   return __ret;
   4589 }
        /* __noswap_vabdq_u8: same builtin call with no lane reversal of the operands
         * or the result. */
   4590 __ai __attribute__((target("neon"))) uint8x16_t __noswap_vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   4591   uint8x16_t __ret;
   4592   __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
   4593   return __ret;
   4594 }
   4595 #endif
   4596 
   4597 #ifdef __LITTLE_ENDIAN__
        /* vabdq_u32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 50 and returns the
         * result cast to uint32x4_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4598 __ai __attribute__((target("neon"))) uint32x4_t vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   4599   uint32x4_t __ret;
   4600   __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   4601   return __ret;
   4602 }
   4603 #else
        /* vabdq_u32 when __LITTLE_ENDIAN__ is not defined: reverses the 4 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4604 __ai __attribute__((target("neon"))) uint32x4_t vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   4605   uint32x4_t __ret;
   4606   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4607   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   4608   __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
   4609   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4610   return __ret;
   4611 }
        /* __noswap_vabdq_u32: same builtin call with no lane reversal of the
         * operands or the result. */
   4612 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   4613   uint32x4_t __ret;
   4614   __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   4615   return __ret;
   4616 }
   4617 #endif
   4618 
   4619 #ifdef __LITTLE_ENDIAN__
        /* vabdq_u16 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 49 and returns the
         * result cast to uint16x8_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4620 __ai __attribute__((target("neon"))) uint16x8_t vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   4621   uint16x8_t __ret;
   4622   __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
   4623   return __ret;
   4624 }
   4625 #else
        /* vabdq_u16 when __LITTLE_ENDIAN__ is not defined: reverses the 8 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4626 __ai __attribute__((target("neon"))) uint16x8_t vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   4627   uint16x8_t __ret;
   4628   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4629   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   4630   __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
   4631   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4632   return __ret;
   4633 }
        /* __noswap_vabdq_u16: same builtin call with no lane reversal of the
         * operands or the result. */
   4634 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   4635   uint16x8_t __ret;
   4636   __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
   4637   return __ret;
   4638 }
   4639 #endif
   4640 
   4641 #ifdef __LITTLE_ENDIAN__
        /* vabdq_s8 when __LITTLE_ENDIAN__ is defined: passes both operands to
         * __builtin_neon_vabdq_v with the constant 32 and returns the int8x16_t
         * result. The name suggests a per-lane absolute difference; the operation
         * itself lives in the builtin, not shown here. */
   4642 __ai __attribute__((target("neon"))) int8x16_t vabdq_s8(int8x16_t __p0, int8x16_t __p1) {
   4643   int8x16_t __ret;
   4644   __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
   4645   return __ret;
   4646 }
   4647 #else
        /* vabdq_s8 when __LITTLE_ENDIAN__ is not defined: reverses the 16 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4648 __ai __attribute__((target("neon"))) int8x16_t vabdq_s8(int8x16_t __p0, int8x16_t __p1) {
   4649   int8x16_t __ret;
   4650   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4651   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4652   __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
   4653   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4654   return __ret;
   4655 }
        /* __noswap_vabdq_s8: same builtin call with no lane reversal of the operands
         * or the result. */
   4656 __ai __attribute__((target("neon"))) int8x16_t __noswap_vabdq_s8(int8x16_t __p0, int8x16_t __p1) {
   4657   int8x16_t __ret;
   4658   __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
   4659   return __ret;
   4660 }
   4661 #endif
   4662 
   4663 #ifdef __LITTLE_ENDIAN__
        /* vabdq_f32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 41 and returns the
         * result cast to float32x4_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4664 __ai __attribute__((target("neon"))) float32x4_t vabdq_f32(float32x4_t __p0, float32x4_t __p1) {
   4665   float32x4_t __ret;
   4666   __ret = (float32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
   4667   return __ret;
   4668 }
   4669 #else
        /* vabdq_f32 when __LITTLE_ENDIAN__ is not defined: reverses the 4 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes.
         * No __noswap_ variant is defined in this group. */
   4670 __ai __attribute__((target("neon"))) float32x4_t vabdq_f32(float32x4_t __p0, float32x4_t __p1) {
   4671   float32x4_t __ret;
   4672   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4673   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   4674   __ret = (float32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
   4675   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4676   return __ret;
   4677 }
   4678 #endif
   4679 
   4680 #ifdef __LITTLE_ENDIAN__
        /* vabdq_s32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 34 and returns the
         * result cast to int32x4_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4681 __ai __attribute__((target("neon"))) int32x4_t vabdq_s32(int32x4_t __p0, int32x4_t __p1) {
   4682   int32x4_t __ret;
   4683   __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
   4684   return __ret;
   4685 }
   4686 #else
        /* vabdq_s32 when __LITTLE_ENDIAN__ is not defined: reverses the 4 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4687 __ai __attribute__((target("neon"))) int32x4_t vabdq_s32(int32x4_t __p0, int32x4_t __p1) {
   4688   int32x4_t __ret;
   4689   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4690   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   4691   __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
   4692   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4693   return __ret;
   4694 }
        /* __noswap_vabdq_s32: same builtin call with no lane reversal of the
         * operands or the result. */
   4695 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabdq_s32(int32x4_t __p0, int32x4_t __p1) {
   4696   int32x4_t __ret;
   4697   __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
   4698   return __ret;
   4699 }
   4700 #endif
   4701 
   4702 #ifdef __LITTLE_ENDIAN__
        /* vabdq_s16 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x16_t, to __builtin_neon_vabdq_v with the constant 33 and returns the
         * result cast to int16x8_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4703 __ai __attribute__((target("neon"))) int16x8_t vabdq_s16(int16x8_t __p0, int16x8_t __p1) {
   4704   int16x8_t __ret;
   4705   __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
   4706   return __ret;
   4707 }
   4708 #else
        /* vabdq_s16 when __LITTLE_ENDIAN__ is not defined: reverses the 8 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4709 __ai __attribute__((target("neon"))) int16x8_t vabdq_s16(int16x8_t __p0, int16x8_t __p1) {
   4710   int16x8_t __ret;
   4711   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4712   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   4713   __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
   4714   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4715   return __ret;
   4716 }
        /* __noswap_vabdq_s16: same builtin call with no lane reversal of the
         * operands or the result. */
   4717 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabdq_s16(int16x8_t __p0, int16x8_t __p1) {
   4718   int16x8_t __ret;
   4719   __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
   4720   return __ret;
   4721 }
   4722 #endif
   4723 
   4724 #ifdef __LITTLE_ENDIAN__
        /* vabd_u8 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 16 and returns the
         * result cast to uint8x8_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4725 __ai __attribute__((target("neon"))) uint8x8_t vabd_u8(uint8x8_t __p0, uint8x8_t __p1) {
   4726   uint8x8_t __ret;
   4727   __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
   4728   return __ret;
   4729 }
   4730 #else
        /* vabd_u8 when __LITTLE_ENDIAN__ is not defined: reverses the 8 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4731 __ai __attribute__((target("neon"))) uint8x8_t vabd_u8(uint8x8_t __p0, uint8x8_t __p1) {
   4732   uint8x8_t __ret;
   4733   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4734   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   4735   __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
   4736   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4737   return __ret;
   4738 }
        /* __noswap_vabd_u8: same builtin call with no lane reversal of the operands
         * or the result. */
   4739 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vabd_u8(uint8x8_t __p0, uint8x8_t __p1) {
   4740   uint8x8_t __ret;
   4741   __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
   4742   return __ret;
   4743 }
   4744 #endif
   4745 
   4746 #ifdef __LITTLE_ENDIAN__
        /* vabd_u32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 18 and returns the
         * result cast to uint32x2_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4747 __ai __attribute__((target("neon"))) uint32x2_t vabd_u32(uint32x2_t __p0, uint32x2_t __p1) {
   4748   uint32x2_t __ret;
   4749   __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   4750   return __ret;
   4751 }
   4752 #else
        /* vabd_u32 when __LITTLE_ENDIAN__ is not defined: swaps the 2 lanes of each
         * operand, makes the same builtin call, then swaps the result lanes. */
   4753 __ai __attribute__((target("neon"))) uint32x2_t vabd_u32(uint32x2_t __p0, uint32x2_t __p1) {
   4754   uint32x2_t __ret;
   4755   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   4756   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   4757   __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
   4758   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   4759   return __ret;
   4760 }
        /* __noswap_vabd_u32: same builtin call with no lane reversal of the operands
         * or the result. */
   4761 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vabd_u32(uint32x2_t __p0, uint32x2_t __p1) {
   4762   uint32x2_t __ret;
   4763   __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   4764   return __ret;
   4765 }
   4766 #endif
   4767 
   4768 #ifdef __LITTLE_ENDIAN__
        /* vabd_u16 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 17 and returns the
         * result cast to uint16x4_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4769 __ai __attribute__((target("neon"))) uint16x4_t vabd_u16(uint16x4_t __p0, uint16x4_t __p1) {
   4770   uint16x4_t __ret;
   4771   __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
   4772   return __ret;
   4773 }
   4774 #else
        /* vabd_u16 when __LITTLE_ENDIAN__ is not defined: reverses the 4 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4775 __ai __attribute__((target("neon"))) uint16x4_t vabd_u16(uint16x4_t __p0, uint16x4_t __p1) {
   4776   uint16x4_t __ret;
   4777   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4778   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   4779   __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
   4780   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4781   return __ret;
   4782 }
        /* __noswap_vabd_u16: same builtin call with no lane reversal of the operands
         * or the result. */
   4783 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vabd_u16(uint16x4_t __p0, uint16x4_t __p1) {
   4784   uint16x4_t __ret;
   4785   __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
   4786   return __ret;
   4787 }
   4788 #endif
   4789 
   4790 #ifdef __LITTLE_ENDIAN__
        /* vabd_s8 when __LITTLE_ENDIAN__ is defined: passes both operands to
         * __builtin_neon_vabd_v with the constant 0 and returns the int8x8_t result.
         * The name suggests a per-lane absolute difference; the operation itself
         * lives in the builtin, not shown here. */
   4791 __ai __attribute__((target("neon"))) int8x8_t vabd_s8(int8x8_t __p0, int8x8_t __p1) {
   4792   int8x8_t __ret;
   4793   __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
   4794   return __ret;
   4795 }
   4796 #else
        /* vabd_s8 when __LITTLE_ENDIAN__ is not defined: reverses the 8 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4797 __ai __attribute__((target("neon"))) int8x8_t vabd_s8(int8x8_t __p0, int8x8_t __p1) {
   4798   int8x8_t __ret;
   4799   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4800   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   4801   __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
   4802   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4803   return __ret;
   4804 }
        /* __noswap_vabd_s8: same builtin call with no lane reversal of the operands
         * or the result. */
   4805 __ai __attribute__((target("neon"))) int8x8_t __noswap_vabd_s8(int8x8_t __p0, int8x8_t __p1) {
   4806   int8x8_t __ret;
   4807   __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
   4808   return __ret;
   4809 }
   4810 #endif
   4811 
   4812 #ifdef __LITTLE_ENDIAN__
        /* vabd_f32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 9 and returns the
         * result cast to float32x2_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4813 __ai __attribute__((target("neon"))) float32x2_t vabd_f32(float32x2_t __p0, float32x2_t __p1) {
   4814   float32x2_t __ret;
   4815   __ret = (float32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
   4816   return __ret;
   4817 }
   4818 #else
        /* vabd_f32 when __LITTLE_ENDIAN__ is not defined: swaps the 2 lanes of each
         * operand, makes the same builtin call, then swaps the result lanes. No
         * __noswap_ variant is defined in this group. */
   4819 __ai __attribute__((target("neon"))) float32x2_t vabd_f32(float32x2_t __p0, float32x2_t __p1) {
   4820   float32x2_t __ret;
   4821   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   4822   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   4823   __ret = (float32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
   4824   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   4825   return __ret;
   4826 }
   4827 #endif
   4828 
   4829 #ifdef __LITTLE_ENDIAN__
        /* vabd_s32 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 2 and returns the
         * result cast to int32x2_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4830 __ai __attribute__((target("neon"))) int32x2_t vabd_s32(int32x2_t __p0, int32x2_t __p1) {
   4831   int32x2_t __ret;
   4832   __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
   4833   return __ret;
   4834 }
   4835 #else
        /* vabd_s32 when __LITTLE_ENDIAN__ is not defined: swaps the 2 lanes of each
         * operand, makes the same builtin call, then swaps the result lanes. */
   4836 __ai __attribute__((target("neon"))) int32x2_t vabd_s32(int32x2_t __p0, int32x2_t __p1) {
   4837   int32x2_t __ret;
   4838   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   4839   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   4840   __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
   4841   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   4842   return __ret;
   4843 }
        /* __noswap_vabd_s32: same builtin call with no lane reversal of the operands
         * or the result. */
   4844 __ai __attribute__((target("neon"))) int32x2_t __noswap_vabd_s32(int32x2_t __p0, int32x2_t __p1) {
   4845   int32x2_t __ret;
   4846   __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
   4847   return __ret;
   4848 }
   4849 #endif
   4850 
   4851 #ifdef __LITTLE_ENDIAN__
        /* vabd_s16 when __LITTLE_ENDIAN__ is defined: passes both operands, cast to
         * int8x8_t, to __builtin_neon_vabd_v with the constant 1 and returns the
         * result cast to int16x4_t. The name suggests a per-lane absolute
         * difference; the operation itself lives in the builtin, not shown here. */
   4852 __ai __attribute__((target("neon"))) int16x4_t vabd_s16(int16x4_t __p0, int16x4_t __p1) {
   4853   int16x4_t __ret;
   4854   __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
   4855   return __ret;
   4856 }
   4857 #else
        /* vabd_s16 when __LITTLE_ENDIAN__ is not defined: reverses the 4 lanes of
         * each operand, makes the same builtin call, then reverses the result lanes. */
   4858 __ai __attribute__((target("neon"))) int16x4_t vabd_s16(int16x4_t __p0, int16x4_t __p1) {
   4859   int16x4_t __ret;
   4860   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4861   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   4862   __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
   4863   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4864   return __ret;
   4865 }
        /* __noswap_vabd_s16: same builtin call with no lane reversal of the operands
         * or the result. */
   4866 __ai __attribute__((target("neon"))) int16x4_t __noswap_vabd_s16(int16x4_t __p0, int16x4_t __p1) {
   4867   int16x4_t __ret;
   4868   __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
   4869   return __ret;
   4870 }
   4871 #endif
   4872 
   4873 #ifdef __LITTLE_ENDIAN__
        /* vabsq_s8 when __LITTLE_ENDIAN__ is defined: passes the operand to
         * __builtin_neon_vabsq_v with the constant 32 and returns the int8x16_t
         * result. The name suggests a per-lane absolute value; the operation itself
         * lives in the builtin, not shown here. */
   4874 __ai __attribute__((target("neon"))) int8x16_t vabsq_s8(int8x16_t __p0) {
   4875   int8x16_t __ret;
   4876   __ret = (int8x16_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 32);
   4877   return __ret;
   4878 }
   4879 #else
        /* vabsq_s8 when __LITTLE_ENDIAN__ is not defined: reverses the 16 operand
         * lanes, makes the same builtin call, then reverses the result lanes. */
   4880 __ai __attribute__((target("neon"))) int8x16_t vabsq_s8(int8x16_t __p0) {
   4881   int8x16_t __ret;
   4882   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4883   __ret = (int8x16_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 32);
   4884   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   4885   return __ret;
   4886 }
   4887 #endif
   4888 
   4889 #ifdef __LITTLE_ENDIAN__
        /* vabsq_f32 when __LITTLE_ENDIAN__ is defined: passes the operand, cast to
         * int8x16_t, to __builtin_neon_vabsq_v with the constant 41 and returns the
         * result cast to float32x4_t. The name suggests a per-lane absolute value;
         * the operation itself lives in the builtin, not shown here. */
   4890 __ai __attribute__((target("neon"))) float32x4_t vabsq_f32(float32x4_t __p0) {
   4891   float32x4_t __ret;
   4892   __ret = (float32x4_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 41);
   4893   return __ret;
   4894 }
   4895 #else
        /* vabsq_f32 when __LITTLE_ENDIAN__ is not defined: reverses the 4 operand
         * lanes, makes the same builtin call, then reverses the result lanes. */
   4896 __ai __attribute__((target("neon"))) float32x4_t vabsq_f32(float32x4_t __p0) {
   4897   float32x4_t __ret;
   4898   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4899   __ret = (float32x4_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 41);
   4900   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4901   return __ret;
   4902 }
   4903 #endif
   4904 
   4905 #ifdef __LITTLE_ENDIAN__
   4906 __ai __attribute__((target("neon"))) int32x4_t vabsq_s32(int32x4_t __p0) {
   4907   int32x4_t __ret;
   4908   __ret = (int32x4_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 34);
   4909   return __ret;
   4910 }
   4911 #else
   4912 __ai __attribute__((target("neon"))) int32x4_t vabsq_s32(int32x4_t __p0) {
   4913   int32x4_t __ret;
   4914   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4915   __ret = (int32x4_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 34);
   4916   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4917   return __ret;
   4918 }
   4919 #endif
   4920 
   4921 #ifdef __LITTLE_ENDIAN__
   4922 __ai __attribute__((target("neon"))) int16x8_t vabsq_s16(int16x8_t __p0) {
   4923   int16x8_t __ret;
   4924   __ret = (int16x8_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 33);
   4925   return __ret;
   4926 }
   4927 #else
   4928 __ai __attribute__((target("neon"))) int16x8_t vabsq_s16(int16x8_t __p0) {
   4929   int16x8_t __ret;
   4930   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4931   __ret = (int16x8_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 33);
   4932   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4933   return __ret;
   4934 }
   4935 #endif
   4936 
   4937 #ifdef __LITTLE_ENDIAN__
   4938 __ai __attribute__((target("neon"))) int8x8_t vabs_s8(int8x8_t __p0) {
   4939   int8x8_t __ret;
   4940   __ret = (int8x8_t) __builtin_neon_vabs_v((int8x8_t)__p0, 0);
   4941   return __ret;
   4942 }
   4943 #else
   4944 __ai __attribute__((target("neon"))) int8x8_t vabs_s8(int8x8_t __p0) {
   4945   int8x8_t __ret;
   4946   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   4947   __ret = (int8x8_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 0);
   4948   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   4949   return __ret;
   4950 }
   4951 #endif
   4952 
   4953 #ifdef __LITTLE_ENDIAN__
   4954 __ai __attribute__((target("neon"))) float32x2_t vabs_f32(float32x2_t __p0) {
   4955   float32x2_t __ret;
   4956   __ret = (float32x2_t) __builtin_neon_vabs_v((int8x8_t)__p0, 9);
   4957   return __ret;
   4958 }
   4959 #else
   4960 __ai __attribute__((target("neon"))) float32x2_t vabs_f32(float32x2_t __p0) {
   4961   float32x2_t __ret;
   4962   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   4963   __ret = (float32x2_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 9);
   4964   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   4965   return __ret;
   4966 }
   4967 #endif
   4968 
   4969 #ifdef __LITTLE_ENDIAN__
   4970 __ai __attribute__((target("neon"))) int32x2_t vabs_s32(int32x2_t __p0) {
   4971   int32x2_t __ret;
   4972   __ret = (int32x2_t) __builtin_neon_vabs_v((int8x8_t)__p0, 2);
   4973   return __ret;
   4974 }
   4975 #else
   4976 __ai __attribute__((target("neon"))) int32x2_t vabs_s32(int32x2_t __p0) {
   4977   int32x2_t __ret;
   4978   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   4979   __ret = (int32x2_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 2);
   4980   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   4981   return __ret;
   4982 }
   4983 #endif
   4984 
   4985 #ifdef __LITTLE_ENDIAN__
   4986 __ai __attribute__((target("neon"))) int16x4_t vabs_s16(int16x4_t __p0) {
   4987   int16x4_t __ret;
   4988   __ret = (int16x4_t) __builtin_neon_vabs_v((int8x8_t)__p0, 1);
   4989   return __ret;
   4990 }
   4991 #else
   4992 __ai __attribute__((target("neon"))) int16x4_t vabs_s16(int16x4_t __p0) {
   4993   int16x4_t __ret;
   4994   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   4995   __ret = (int16x4_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 1);
   4996   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   4997   return __ret;
   4998 }
   4999 #endif
   5000 
   5001 #ifdef __LITTLE_ENDIAN__
   5002 __ai __attribute__((target("neon"))) uint8x16_t vaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5003   uint8x16_t __ret;
   5004   __ret = __p0 + __p1;
   5005   return __ret;
   5006 }
   5007 #else
   5008 __ai __attribute__((target("neon"))) uint8x16_t vaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5009   uint8x16_t __ret;
   5010   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5011   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5012   __ret = __rev0 + __rev1;
   5013   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5014   return __ret;
   5015 }
   5016 #endif
   5017 
   5018 #ifdef __LITTLE_ENDIAN__
   5019 __ai __attribute__((target("neon"))) uint32x4_t vaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5020   uint32x4_t __ret;
   5021   __ret = __p0 + __p1;
   5022   return __ret;
   5023 }
   5024 #else
   5025 __ai __attribute__((target("neon"))) uint32x4_t vaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5026   uint32x4_t __ret;
   5027   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5028   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5029   __ret = __rev0 + __rev1;
   5030   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5031   return __ret;
   5032 }
   5033 #endif
   5034 
   5035 #ifdef __LITTLE_ENDIAN__
   5036 __ai __attribute__((target("neon"))) uint64x2_t vaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5037   uint64x2_t __ret;
   5038   __ret = __p0 + __p1;
   5039   return __ret;
   5040 }
   5041 #else
   5042 __ai __attribute__((target("neon"))) uint64x2_t vaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5043   uint64x2_t __ret;
   5044   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5045   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5046   __ret = __rev0 + __rev1;
   5047   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5048   return __ret;
   5049 }
   5050 #endif
   5051 
   5052 #ifdef __LITTLE_ENDIAN__
   5053 __ai __attribute__((target("neon"))) uint16x8_t vaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5054   uint16x8_t __ret;
   5055   __ret = __p0 + __p1;
   5056   return __ret;
   5057 }
   5058 #else
   5059 __ai __attribute__((target("neon"))) uint16x8_t vaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5060   uint16x8_t __ret;
   5061   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5062   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5063   __ret = __rev0 + __rev1;
   5064   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5065   return __ret;
   5066 }
   5067 #endif
   5068 
   5069 #ifdef __LITTLE_ENDIAN__
   5070 __ai __attribute__((target("neon"))) int8x16_t vaddq_s8(int8x16_t __p0, int8x16_t __p1) {
   5071   int8x16_t __ret;
   5072   __ret = __p0 + __p1;
   5073   return __ret;
   5074 }
   5075 #else
   5076 __ai __attribute__((target("neon"))) int8x16_t vaddq_s8(int8x16_t __p0, int8x16_t __p1) {
   5077   int8x16_t __ret;
   5078   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5079   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5080   __ret = __rev0 + __rev1;
   5081   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5082   return __ret;
   5083 }
   5084 #endif
   5085 
   5086 #ifdef __LITTLE_ENDIAN__
   5087 __ai __attribute__((target("neon"))) float32x4_t vaddq_f32(float32x4_t __p0, float32x4_t __p1) {
   5088   float32x4_t __ret;
   5089   __ret = __p0 + __p1;
   5090   return __ret;
   5091 }
   5092 #else
   5093 __ai __attribute__((target("neon"))) float32x4_t vaddq_f32(float32x4_t __p0, float32x4_t __p1) {
   5094   float32x4_t __ret;
   5095   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5096   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5097   __ret = __rev0 + __rev1;
   5098   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5099   return __ret;
   5100 }
   5101 #endif
   5102 
   5103 #ifdef __LITTLE_ENDIAN__
   5104 __ai __attribute__((target("neon"))) int32x4_t vaddq_s32(int32x4_t __p0, int32x4_t __p1) {
   5105   int32x4_t __ret;
   5106   __ret = __p0 + __p1;
   5107   return __ret;
   5108 }
   5109 #else
   5110 __ai __attribute__((target("neon"))) int32x4_t vaddq_s32(int32x4_t __p0, int32x4_t __p1) {
   5111   int32x4_t __ret;
   5112   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5113   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5114   __ret = __rev0 + __rev1;
   5115   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5116   return __ret;
   5117 }
   5118 #endif
   5119 
   5120 #ifdef __LITTLE_ENDIAN__
   5121 __ai __attribute__((target("neon"))) int64x2_t vaddq_s64(int64x2_t __p0, int64x2_t __p1) {
   5122   int64x2_t __ret;
   5123   __ret = __p0 + __p1;
   5124   return __ret;
   5125 }
   5126 #else
   5127 __ai __attribute__((target("neon"))) int64x2_t vaddq_s64(int64x2_t __p0, int64x2_t __p1) {
   5128   int64x2_t __ret;
   5129   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5130   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5131   __ret = __rev0 + __rev1;
   5132   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5133   return __ret;
   5134 }
   5135 #endif
   5136 
   5137 #ifdef __LITTLE_ENDIAN__
   5138 __ai __attribute__((target("neon"))) int16x8_t vaddq_s16(int16x8_t __p0, int16x8_t __p1) {
   5139   int16x8_t __ret;
   5140   __ret = __p0 + __p1;
   5141   return __ret;
   5142 }
   5143 #else
   5144 __ai __attribute__((target("neon"))) int16x8_t vaddq_s16(int16x8_t __p0, int16x8_t __p1) {
   5145   int16x8_t __ret;
   5146   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5147   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5148   __ret = __rev0 + __rev1;
   5149   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5150   return __ret;
   5151 }
   5152 #endif
   5153 
   5154 #ifdef __LITTLE_ENDIAN__
   5155 __ai __attribute__((target("neon"))) uint8x8_t vadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5156   uint8x8_t __ret;
   5157   __ret = __p0 + __p1;
   5158   return __ret;
   5159 }
   5160 #else
   5161 __ai __attribute__((target("neon"))) uint8x8_t vadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5162   uint8x8_t __ret;
   5163   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5164   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5165   __ret = __rev0 + __rev1;
   5166   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5167   return __ret;
   5168 }
   5169 #endif
   5170 
   5171 #ifdef __LITTLE_ENDIAN__
   5172 __ai __attribute__((target("neon"))) uint32x2_t vadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5173   uint32x2_t __ret;
   5174   __ret = __p0 + __p1;
   5175   return __ret;
   5176 }
   5177 #else
   5178 __ai __attribute__((target("neon"))) uint32x2_t vadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5179   uint32x2_t __ret;
   5180   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5181   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5182   __ret = __rev0 + __rev1;
   5183   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5184   return __ret;
   5185 }
   5186 #endif
   5187 
   5188 __ai __attribute__((target("neon"))) uint64x1_t vadd_u64(uint64x1_t __p0, uint64x1_t __p1) {
   5189   uint64x1_t __ret;
   5190   __ret = __p0 + __p1;
   5191   return __ret;
   5192 }
   5193 #ifdef __LITTLE_ENDIAN__
   5194 __ai __attribute__((target("neon"))) uint16x4_t vadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5195   uint16x4_t __ret;
   5196   __ret = __p0 + __p1;
   5197   return __ret;
   5198 }
   5199 #else
   5200 __ai __attribute__((target("neon"))) uint16x4_t vadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5201   uint16x4_t __ret;
   5202   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5203   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5204   __ret = __rev0 + __rev1;
   5205   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5206   return __ret;
   5207 }
   5208 #endif
   5209 
   5210 #ifdef __LITTLE_ENDIAN__
   5211 __ai __attribute__((target("neon"))) int8x8_t vadd_s8(int8x8_t __p0, int8x8_t __p1) {
   5212   int8x8_t __ret;
   5213   __ret = __p0 + __p1;
   5214   return __ret;
   5215 }
   5216 #else
   5217 __ai __attribute__((target("neon"))) int8x8_t vadd_s8(int8x8_t __p0, int8x8_t __p1) {
   5218   int8x8_t __ret;
   5219   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5220   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5221   __ret = __rev0 + __rev1;
   5222   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5223   return __ret;
   5224 }
   5225 #endif
   5226 
   5227 #ifdef __LITTLE_ENDIAN__
   5228 __ai __attribute__((target("neon"))) float32x2_t vadd_f32(float32x2_t __p0, float32x2_t __p1) {
   5229   float32x2_t __ret;
   5230   __ret = __p0 + __p1;
   5231   return __ret;
   5232 }
   5233 #else
   5234 __ai __attribute__((target("neon"))) float32x2_t vadd_f32(float32x2_t __p0, float32x2_t __p1) {
   5235   float32x2_t __ret;
   5236   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5237   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5238   __ret = __rev0 + __rev1;
   5239   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5240   return __ret;
   5241 }
   5242 #endif
   5243 
   5244 #ifdef __LITTLE_ENDIAN__
   5245 __ai __attribute__((target("neon"))) int32x2_t vadd_s32(int32x2_t __p0, int32x2_t __p1) {
   5246   int32x2_t __ret;
   5247   __ret = __p0 + __p1;
   5248   return __ret;
   5249 }
   5250 #else
   5251 __ai __attribute__((target("neon"))) int32x2_t vadd_s32(int32x2_t __p0, int32x2_t __p1) {
   5252   int32x2_t __ret;
   5253   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5254   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5255   __ret = __rev0 + __rev1;
   5256   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5257   return __ret;
   5258 }
   5259 #endif
   5260 
   5261 __ai __attribute__((target("neon"))) int64x1_t vadd_s64(int64x1_t __p0, int64x1_t __p1) {
   5262   int64x1_t __ret;
   5263   __ret = __p0 + __p1;
   5264   return __ret;
   5265 }
   5266 #ifdef __LITTLE_ENDIAN__
   5267 __ai __attribute__((target("neon"))) int16x4_t vadd_s16(int16x4_t __p0, int16x4_t __p1) {
   5268   int16x4_t __ret;
   5269   __ret = __p0 + __p1;
   5270   return __ret;
   5271 }
   5272 #else
   5273 __ai __attribute__((target("neon"))) int16x4_t vadd_s16(int16x4_t __p0, int16x4_t __p1) {
   5274   int16x4_t __ret;
   5275   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5276   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5277   __ret = __rev0 + __rev1;
   5278   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5279   return __ret;
   5280 }
   5281 #endif
   5282 
   5283 #ifdef __LITTLE_ENDIAN__
   5284 __ai __attribute__((target("neon"))) poly8x8_t vadd_p8(poly8x8_t __p0, poly8x8_t __p1) {
   5285   poly8x8_t __ret;
   5286   __ret = (poly8x8_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 4);
   5287   return __ret;
   5288 }
   5289 #else
   5290 __ai __attribute__((target("neon"))) poly8x8_t vadd_p8(poly8x8_t __p0, poly8x8_t __p1) {
   5291   poly8x8_t __ret;
   5292   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5293   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5294   __ret = (poly8x8_t) __builtin_neon_vadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4);
   5295   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5296   return __ret;
   5297 }
   5298 #endif
   5299 
   5300 __ai __attribute__((target("neon"))) poly64x1_t vadd_p64(poly64x1_t __p0, poly64x1_t __p1) {
   5301   poly64x1_t __ret;
   5302   __ret = (poly64x1_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 6);
   5303   return __ret;
   5304 }
   5305 #ifdef __LITTLE_ENDIAN__
   5306 __ai __attribute__((target("neon"))) poly16x4_t vadd_p16(poly16x4_t __p0, poly16x4_t __p1) {
   5307   poly16x4_t __ret;
   5308   __ret = (poly16x4_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 5);
   5309   return __ret;
   5310 }
   5311 #else
   5312 __ai __attribute__((target("neon"))) poly16x4_t vadd_p16(poly16x4_t __p0, poly16x4_t __p1) {
   5313   poly16x4_t __ret;
   5314   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5315   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5316   __ret = (poly16x4_t) __builtin_neon_vadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 5);
   5317   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5318   return __ret;
   5319 }
   5320 #endif
   5321 
   5322 #ifdef __LITTLE_ENDIAN__
   5323 __ai __attribute__((target("neon"))) poly8x16_t vaddq_p8(poly8x16_t __p0, poly8x16_t __p1) {
   5324   poly8x16_t __ret;
   5325   __ret = (poly8x16_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 36);
   5326   return __ret;
   5327 }
   5328 #else
   5329 __ai __attribute__((target("neon"))) poly8x16_t vaddq_p8(poly8x16_t __p0, poly8x16_t __p1) {
   5330   poly8x16_t __ret;
   5331   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5332   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5333   __ret = (poly8x16_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36);
   5334   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5335   return __ret;
   5336 }
   5337 #endif
   5338 
   5339 #ifdef __LITTLE_ENDIAN__
   5340 __ai __attribute__((target("neon"))) poly64x2_t vaddq_p64(poly64x2_t __p0, poly64x2_t __p1) {
   5341   poly64x2_t __ret;
   5342   __ret = (poly64x2_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 38);
   5343   return __ret;
   5344 }
   5345 #else
   5346 __ai __attribute__((target("neon"))) poly64x2_t vaddq_p64(poly64x2_t __p0, poly64x2_t __p1) {
   5347   poly64x2_t __ret;
   5348   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5349   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5350   __ret = (poly64x2_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 38);
   5351   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5352   return __ret;
   5353 }
   5354 #endif
   5355 
   5356 #ifdef __LITTLE_ENDIAN__
   5357 __ai __attribute__((target("neon"))) poly16x8_t vaddq_p16(poly16x8_t __p0, poly16x8_t __p1) {
   5358   poly16x8_t __ret;
   5359   __ret = (poly16x8_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 37);
   5360   return __ret;
   5361 }
   5362 #else
   5363 __ai __attribute__((target("neon"))) poly16x8_t vaddq_p16(poly16x8_t __p0, poly16x8_t __p1) {
   5364   poly16x8_t __ret;
   5365   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5366   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5367   __ret = (poly16x8_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 37);
   5368   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5369   return __ret;
   5370 }
   5371 #endif
   5372 
   5373 #ifdef __LITTLE_ENDIAN__
   5374 __ai __attribute__((target("neon"))) uint16x4_t vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5375   uint16x4_t __ret;
   5376   __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
   5377   return __ret;
   5378 }
   5379 #else
   5380 __ai __attribute__((target("neon"))) uint16x4_t vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5381   uint16x4_t __ret;
   5382   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5383   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5384   __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17);
   5385   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5386   return __ret;
   5387 }
   5388 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5389   uint16x4_t __ret;
   5390   __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
   5391   return __ret;
   5392 }
   5393 #endif
   5394 
   5395 #ifdef __LITTLE_ENDIAN__
   5396 __ai __attribute__((target("neon"))) uint32x2_t vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5397   uint32x2_t __ret;
   5398   __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
   5399   return __ret;
   5400 }
   5401 #else
   5402 __ai __attribute__((target("neon"))) uint32x2_t vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5403   uint32x2_t __ret;
   5404   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5405   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5406   __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18);
   5407   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5408   return __ret;
   5409 }
   5410 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5411   uint32x2_t __ret;
   5412   __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
   5413   return __ret;
   5414 }
   5415 #endif
   5416 
   5417 #ifdef __LITTLE_ENDIAN__
   5418 __ai __attribute__((target("neon"))) uint8x8_t vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5419   uint8x8_t __ret;
   5420   __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
   5421   return __ret;
   5422 }
   5423 #else
   5424 __ai __attribute__((target("neon"))) uint8x8_t vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5425   uint8x8_t __ret;
   5426   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5427   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5428   __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16);
   5429   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5430   return __ret;
   5431 }
   5432 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5433   uint8x8_t __ret;
   5434   __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
   5435   return __ret;
   5436 }
   5437 #endif
   5438 
   5439 #ifdef __LITTLE_ENDIAN__
   5440 __ai __attribute__((target("neon"))) int16x4_t vaddhn_s32(int32x4_t __p0, int32x4_t __p1) {
   5441   int16x4_t __ret;
   5442   __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
   5443   return __ret;
   5444 }
   5445 #else
   5446 __ai __attribute__((target("neon"))) int16x4_t vaddhn_s32(int32x4_t __p0, int32x4_t __p1) {
   5447   int16x4_t __ret;
   5448   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5449   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5450   __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1);
   5451   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5452   return __ret;
   5453 }
   5454 __ai __attribute__((target("neon"))) int16x4_t __noswap_vaddhn_s32(int32x4_t __p0, int32x4_t __p1) {
   5455   int16x4_t __ret;
   5456   __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
   5457   return __ret;
   5458 }
   5459 #endif
   5460 
   5461 #ifdef __LITTLE_ENDIAN__
   5462 __ai __attribute__((target("neon"))) int32x2_t vaddhn_s64(int64x2_t __p0, int64x2_t __p1) {
   5463   int32x2_t __ret;
   5464   __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
   5465   return __ret;
   5466 }
   5467 #else
   5468 __ai __attribute__((target("neon"))) int32x2_t vaddhn_s64(int64x2_t __p0, int64x2_t __p1) {
   5469   int32x2_t __ret;
   5470   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5471   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5472   __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2);
   5473   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5474   return __ret;
   5475 }
   5476 __ai __attribute__((target("neon"))) int32x2_t __noswap_vaddhn_s64(int64x2_t __p0, int64x2_t __p1) {
   5477   int32x2_t __ret;
   5478   __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
   5479   return __ret;
   5480 }
   5481 #endif
   5482 
   5483 #ifdef __LITTLE_ENDIAN__
   5484 __ai __attribute__((target("neon"))) int8x8_t vaddhn_s16(int16x8_t __p0, int16x8_t __p1) {
   5485   int8x8_t __ret;
   5486   __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
   5487   return __ret;
   5488 }
   5489 #else
   5490 __ai __attribute__((target("neon"))) int8x8_t vaddhn_s16(int16x8_t __p0, int16x8_t __p1) {
   5491   int8x8_t __ret;
   5492   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5493   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5494   __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0);
   5495   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5496   return __ret;
   5497 }
   5498 __ai __attribute__((target("neon"))) int8x8_t __noswap_vaddhn_s16(int16x8_t __p0, int16x8_t __p1) {
   5499   int8x8_t __ret;
   5500   __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
   5501   return __ret;
   5502 }
   5503 #endif
   5504 
   5505 #ifdef __LITTLE_ENDIAN__
   5506 __ai __attribute__((target("neon"))) uint8x16_t vandq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5507   uint8x16_t __ret;
   5508   __ret = __p0 & __p1;
   5509   return __ret;
   5510 }
   5511 #else
   5512 __ai __attribute__((target("neon"))) uint8x16_t vandq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5513   uint8x16_t __ret;
   5514   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5515   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5516   __ret = __rev0 & __rev1;
   5517   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5518   return __ret;
   5519 }
   5520 #endif
   5521 
   5522 #ifdef __LITTLE_ENDIAN__
   5523 __ai __attribute__((target("neon"))) uint32x4_t vandq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5524   uint32x4_t __ret;
   5525   __ret = __p0 & __p1;
   5526   return __ret;
   5527 }
   5528 #else
   5529 __ai __attribute__((target("neon"))) uint32x4_t vandq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5530   uint32x4_t __ret;
   5531   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5532   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5533   __ret = __rev0 & __rev1;
   5534   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5535   return __ret;
   5536 }
   5537 #endif
   5538 
   5539 #ifdef __LITTLE_ENDIAN__
   5540 __ai __attribute__((target("neon"))) uint64x2_t vandq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5541   uint64x2_t __ret;
   5542   __ret = __p0 & __p1;
   5543   return __ret;
   5544 }
   5545 #else
   5546 __ai __attribute__((target("neon"))) uint64x2_t vandq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5547   uint64x2_t __ret;
   5548   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5549   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5550   __ret = __rev0 & __rev1;
   5551   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5552   return __ret;
   5553 }
   5554 #endif
   5555 
   5556 #ifdef __LITTLE_ENDIAN__
   5557 __ai __attribute__((target("neon"))) uint16x8_t vandq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5558   uint16x8_t __ret;
   5559   __ret = __p0 & __p1;
   5560   return __ret;
   5561 }
   5562 #else
   5563 __ai __attribute__((target("neon"))) uint16x8_t vandq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5564   uint16x8_t __ret;
   5565   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5566   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5567   __ret = __rev0 & __rev1;
   5568   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5569   return __ret;
   5570 }
   5571 #endif
   5572 
   5573 #ifdef __LITTLE_ENDIAN__
   5574 __ai __attribute__((target("neon"))) int8x16_t vandq_s8(int8x16_t __p0, int8x16_t __p1) {
   5575   int8x16_t __ret;
   5576   __ret = __p0 & __p1;
   5577   return __ret;
   5578 }
   5579 #else
   5580 __ai __attribute__((target("neon"))) int8x16_t vandq_s8(int8x16_t __p0, int8x16_t __p1) {
   5581   int8x16_t __ret;
   5582   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5583   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5584   __ret = __rev0 & __rev1;
   5585   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5586   return __ret;
   5587 }
   5588 #endif
   5589 
   5590 #ifdef __LITTLE_ENDIAN__
   5591 __ai __attribute__((target("neon"))) int32x4_t vandq_s32(int32x4_t __p0, int32x4_t __p1) {
   5592   int32x4_t __ret;
   5593   __ret = __p0 & __p1;
   5594   return __ret;
   5595 }
   5596 #else
   5597 __ai __attribute__((target("neon"))) int32x4_t vandq_s32(int32x4_t __p0, int32x4_t __p1) {
   5598   int32x4_t __ret;
   5599   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5600   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5601   __ret = __rev0 & __rev1;
   5602   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5603   return __ret;
   5604 }
   5605 #endif
   5606 
   5607 #ifdef __LITTLE_ENDIAN__
   5608 __ai __attribute__((target("neon"))) int64x2_t vandq_s64(int64x2_t __p0, int64x2_t __p1) {
   5609   int64x2_t __ret;
   5610   __ret = __p0 & __p1;
   5611   return __ret;
   5612 }
   5613 #else
   5614 __ai __attribute__((target("neon"))) int64x2_t vandq_s64(int64x2_t __p0, int64x2_t __p1) {
   5615   int64x2_t __ret;
   5616   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5617   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5618   __ret = __rev0 & __rev1;
   5619   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5620   return __ret;
   5621 }
   5622 #endif
   5623 
   5624 #ifdef __LITTLE_ENDIAN__
   5625 __ai __attribute__((target("neon"))) int16x8_t vandq_s16(int16x8_t __p0, int16x8_t __p1) {
   5626   int16x8_t __ret;
   5627   __ret = __p0 & __p1;
   5628   return __ret;
   5629 }
   5630 #else
   5631 __ai __attribute__((target("neon"))) int16x8_t vandq_s16(int16x8_t __p0, int16x8_t __p1) {
   5632   int16x8_t __ret;
   5633   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5634   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5635   __ret = __rev0 & __rev1;
   5636   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5637   return __ret;
   5638 }
   5639 #endif
   5640 
   5641 #ifdef __LITTLE_ENDIAN__
   5642 __ai __attribute__((target("neon"))) uint8x8_t vand_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5643   uint8x8_t __ret;
   5644   __ret = __p0 & __p1;
   5645   return __ret;
   5646 }
   5647 #else
   5648 __ai __attribute__((target("neon"))) uint8x8_t vand_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5649   uint8x8_t __ret;
   5650   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5651   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5652   __ret = __rev0 & __rev1;
   5653   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5654   return __ret;
   5655 }
   5656 #endif
   5657 
   5658 #ifdef __LITTLE_ENDIAN__
   5659 __ai __attribute__((target("neon"))) uint32x2_t vand_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5660   uint32x2_t __ret;
   5661   __ret = __p0 & __p1;
   5662   return __ret;
   5663 }
   5664 #else
   5665 __ai __attribute__((target("neon"))) uint32x2_t vand_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5666   uint32x2_t __ret;
   5667   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5668   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5669   __ret = __rev0 & __rev1;
   5670   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5671   return __ret;
   5672 }
   5673 #endif
   5674 
   5675 __ai __attribute__((target("neon"))) uint64x1_t vand_u64(uint64x1_t __p0, uint64x1_t __p1) {
   5676   uint64x1_t __ret;
   5677   __ret = __p0 & __p1;
   5678   return __ret;
   5679 }
   5680 #ifdef __LITTLE_ENDIAN__
   5681 __ai __attribute__((target("neon"))) uint16x4_t vand_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5682   uint16x4_t __ret;
   5683   __ret = __p0 & __p1;
   5684   return __ret;
   5685 }
   5686 #else
   5687 __ai __attribute__((target("neon"))) uint16x4_t vand_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5688   uint16x4_t __ret;
   5689   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5690   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5691   __ret = __rev0 & __rev1;
   5692   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5693   return __ret;
   5694 }
   5695 #endif
   5696 
   5697 #ifdef __LITTLE_ENDIAN__
   5698 __ai __attribute__((target("neon"))) int8x8_t vand_s8(int8x8_t __p0, int8x8_t __p1) {
   5699   int8x8_t __ret;
   5700   __ret = __p0 & __p1;
   5701   return __ret;
   5702 }
   5703 #else
   5704 __ai __attribute__((target("neon"))) int8x8_t vand_s8(int8x8_t __p0, int8x8_t __p1) {
   5705   int8x8_t __ret;
   5706   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5707   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5708   __ret = __rev0 & __rev1;
   5709   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5710   return __ret;
   5711 }
   5712 #endif
   5713 
   5714 #ifdef __LITTLE_ENDIAN__
   5715 __ai __attribute__((target("neon"))) int32x2_t vand_s32(int32x2_t __p0, int32x2_t __p1) {
   5716   int32x2_t __ret;
   5717   __ret = __p0 & __p1;
   5718   return __ret;
   5719 }
   5720 #else
   5721 __ai __attribute__((target("neon"))) int32x2_t vand_s32(int32x2_t __p0, int32x2_t __p1) {
   5722   int32x2_t __ret;
   5723   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5724   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5725   __ret = __rev0 & __rev1;
   5726   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5727   return __ret;
   5728 }
   5729 #endif
   5730 
   5731 __ai __attribute__((target("neon"))) int64x1_t vand_s64(int64x1_t __p0, int64x1_t __p1) {
   5732   int64x1_t __ret;
   5733   __ret = __p0 & __p1;
   5734   return __ret;
   5735 }
   5736 #ifdef __LITTLE_ENDIAN__
   5737 __ai __attribute__((target("neon"))) int16x4_t vand_s16(int16x4_t __p0, int16x4_t __p1) {
   5738   int16x4_t __ret;
   5739   __ret = __p0 & __p1;
   5740   return __ret;
   5741 }
   5742 #else
   5743 __ai __attribute__((target("neon"))) int16x4_t vand_s16(int16x4_t __p0, int16x4_t __p1) {
   5744   int16x4_t __ret;
   5745   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5746   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5747   __ret = __rev0 & __rev1;
   5748   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5749   return __ret;
   5750 }
   5751 #endif
   5752 
   5753 #ifdef __LITTLE_ENDIAN__
   5754 __ai __attribute__((target("neon"))) uint8x16_t vbicq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5755   uint8x16_t __ret;
   5756   __ret = __p0 & ~__p1;
   5757   return __ret;
   5758 }
   5759 #else
   5760 __ai __attribute__((target("neon"))) uint8x16_t vbicq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   5761   uint8x16_t __ret;
   5762   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5763   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5764   __ret = __rev0 & ~__rev1;
   5765   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5766   return __ret;
   5767 }
   5768 #endif
   5769 
   5770 #ifdef __LITTLE_ENDIAN__
   5771 __ai __attribute__((target("neon"))) uint32x4_t vbicq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5772   uint32x4_t __ret;
   5773   __ret = __p0 & ~__p1;
   5774   return __ret;
   5775 }
   5776 #else
   5777 __ai __attribute__((target("neon"))) uint32x4_t vbicq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   5778   uint32x4_t __ret;
   5779   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5780   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5781   __ret = __rev0 & ~__rev1;
   5782   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5783   return __ret;
   5784 }
   5785 #endif
   5786 
   5787 #ifdef __LITTLE_ENDIAN__
   5788 __ai __attribute__((target("neon"))) uint64x2_t vbicq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5789   uint64x2_t __ret;
   5790   __ret = __p0 & ~__p1;
   5791   return __ret;
   5792 }
   5793 #else
   5794 __ai __attribute__((target("neon"))) uint64x2_t vbicq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   5795   uint64x2_t __ret;
   5796   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5797   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5798   __ret = __rev0 & ~__rev1;
   5799   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5800   return __ret;
   5801 }
   5802 #endif
   5803 
   5804 #ifdef __LITTLE_ENDIAN__
   5805 __ai __attribute__((target("neon"))) uint16x8_t vbicq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5806   uint16x8_t __ret;
   5807   __ret = __p0 & ~__p1;
   5808   return __ret;
   5809 }
   5810 #else
   5811 __ai __attribute__((target("neon"))) uint16x8_t vbicq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   5812   uint16x8_t __ret;
   5813   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5814   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5815   __ret = __rev0 & ~__rev1;
   5816   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5817   return __ret;
   5818 }
   5819 #endif
   5820 
   5821 #ifdef __LITTLE_ENDIAN__
   5822 __ai __attribute__((target("neon"))) int8x16_t vbicq_s8(int8x16_t __p0, int8x16_t __p1) {
   5823   int8x16_t __ret;
   5824   __ret = __p0 & ~__p1;
   5825   return __ret;
   5826 }
   5827 #else
   5828 __ai __attribute__((target("neon"))) int8x16_t vbicq_s8(int8x16_t __p0, int8x16_t __p1) {
   5829   int8x16_t __ret;
   5830   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5831   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5832   __ret = __rev0 & ~__rev1;
   5833   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   5834   return __ret;
   5835 }
   5836 #endif
   5837 
   5838 #ifdef __LITTLE_ENDIAN__
   5839 __ai __attribute__((target("neon"))) int32x4_t vbicq_s32(int32x4_t __p0, int32x4_t __p1) {
   5840   int32x4_t __ret;
   5841   __ret = __p0 & ~__p1;
   5842   return __ret;
   5843 }
   5844 #else
   5845 __ai __attribute__((target("neon"))) int32x4_t vbicq_s32(int32x4_t __p0, int32x4_t __p1) {
   5846   int32x4_t __ret;
   5847   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5848   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5849   __ret = __rev0 & ~__rev1;
   5850   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5851   return __ret;
   5852 }
   5853 #endif
   5854 
   5855 #ifdef __LITTLE_ENDIAN__
   5856 __ai __attribute__((target("neon"))) int64x2_t vbicq_s64(int64x2_t __p0, int64x2_t __p1) {
   5857   int64x2_t __ret;
   5858   __ret = __p0 & ~__p1;
   5859   return __ret;
   5860 }
   5861 #else
   5862 __ai __attribute__((target("neon"))) int64x2_t vbicq_s64(int64x2_t __p0, int64x2_t __p1) {
   5863   int64x2_t __ret;
   5864   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5865   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5866   __ret = __rev0 & ~__rev1;
   5867   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5868   return __ret;
   5869 }
   5870 #endif
   5871 
   5872 #ifdef __LITTLE_ENDIAN__
   5873 __ai __attribute__((target("neon"))) int16x8_t vbicq_s16(int16x8_t __p0, int16x8_t __p1) {
   5874   int16x8_t __ret;
   5875   __ret = __p0 & ~__p1;
   5876   return __ret;
   5877 }
   5878 #else
   5879 __ai __attribute__((target("neon"))) int16x8_t vbicq_s16(int16x8_t __p0, int16x8_t __p1) {
   5880   int16x8_t __ret;
   5881   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5882   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5883   __ret = __rev0 & ~__rev1;
   5884   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5885   return __ret;
   5886 }
   5887 #endif
   5888 
   5889 #ifdef __LITTLE_ENDIAN__
   5890 __ai __attribute__((target("neon"))) uint8x8_t vbic_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5891   uint8x8_t __ret;
   5892   __ret = __p0 & ~__p1;
   5893   return __ret;
   5894 }
   5895 #else
   5896 __ai __attribute__((target("neon"))) uint8x8_t vbic_u8(uint8x8_t __p0, uint8x8_t __p1) {
   5897   uint8x8_t __ret;
   5898   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5899   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5900   __ret = __rev0 & ~__rev1;
   5901   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5902   return __ret;
   5903 }
   5904 #endif
   5905 
   5906 #ifdef __LITTLE_ENDIAN__
   5907 __ai __attribute__((target("neon"))) uint32x2_t vbic_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5908   uint32x2_t __ret;
   5909   __ret = __p0 & ~__p1;
   5910   return __ret;
   5911 }
   5912 #else
   5913 __ai __attribute__((target("neon"))) uint32x2_t vbic_u32(uint32x2_t __p0, uint32x2_t __p1) {
   5914   uint32x2_t __ret;
   5915   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5916   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5917   __ret = __rev0 & ~__rev1;
   5918   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5919   return __ret;
   5920 }
   5921 #endif
   5922 
   5923 __ai __attribute__((target("neon"))) uint64x1_t vbic_u64(uint64x1_t __p0, uint64x1_t __p1) {
   5924   uint64x1_t __ret;
   5925   __ret = __p0 & ~__p1;
   5926   return __ret;
   5927 }
   5928 #ifdef __LITTLE_ENDIAN__
   5929 __ai __attribute__((target("neon"))) uint16x4_t vbic_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5930   uint16x4_t __ret;
   5931   __ret = __p0 & ~__p1;
   5932   return __ret;
   5933 }
   5934 #else
   5935 __ai __attribute__((target("neon"))) uint16x4_t vbic_u16(uint16x4_t __p0, uint16x4_t __p1) {
   5936   uint16x4_t __ret;
   5937   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5938   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5939   __ret = __rev0 & ~__rev1;
   5940   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5941   return __ret;
   5942 }
   5943 #endif
   5944 
   5945 #ifdef __LITTLE_ENDIAN__
   5946 __ai __attribute__((target("neon"))) int8x8_t vbic_s8(int8x8_t __p0, int8x8_t __p1) {
   5947   int8x8_t __ret;
   5948   __ret = __p0 & ~__p1;
   5949   return __ret;
   5950 }
   5951 #else
   5952 __ai __attribute__((target("neon"))) int8x8_t vbic_s8(int8x8_t __p0, int8x8_t __p1) {
   5953   int8x8_t __ret;
   5954   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   5955   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   5956   __ret = __rev0 & ~__rev1;
   5957   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   5958   return __ret;
   5959 }
   5960 #endif
   5961 
   5962 #ifdef __LITTLE_ENDIAN__
   5963 __ai __attribute__((target("neon"))) int32x2_t vbic_s32(int32x2_t __p0, int32x2_t __p1) {
   5964   int32x2_t __ret;
   5965   __ret = __p0 & ~__p1;
   5966   return __ret;
   5967 }
   5968 #else
   5969 __ai __attribute__((target("neon"))) int32x2_t vbic_s32(int32x2_t __p0, int32x2_t __p1) {
   5970   int32x2_t __ret;
   5971   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   5972   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   5973   __ret = __rev0 & ~__rev1;
   5974   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   5975   return __ret;
   5976 }
   5977 #endif
   5978 
   5979 __ai __attribute__((target("neon"))) int64x1_t vbic_s64(int64x1_t __p0, int64x1_t __p1) {
   5980   int64x1_t __ret;
   5981   __ret = __p0 & ~__p1;
   5982   return __ret;
   5983 }
   5984 #ifdef __LITTLE_ENDIAN__
   5985 __ai __attribute__((target("neon"))) int16x4_t vbic_s16(int16x4_t __p0, int16x4_t __p1) {
   5986   int16x4_t __ret;
   5987   __ret = __p0 & ~__p1;
   5988   return __ret;
   5989 }
   5990 #else
   5991 __ai __attribute__((target("neon"))) int16x4_t vbic_s16(int16x4_t __p0, int16x4_t __p1) {
   5992   int16x4_t __ret;
   5993   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   5994   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   5995   __ret = __rev0 & ~__rev1;
   5996   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   5997   return __ret;
   5998 }
   5999 #endif
   6000 
   6001 #ifdef __LITTLE_ENDIAN__
   6002 __ai __attribute__((target("neon"))) poly8x8_t vbsl_p8(uint8x8_t __p0, poly8x8_t __p1, poly8x8_t __p2) {
   6003   poly8x8_t __ret;
   6004   __ret = (poly8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 4);
   6005   return __ret;
   6006 }
   6007 #else
   6008 __ai __attribute__((target("neon"))) poly8x8_t vbsl_p8(uint8x8_t __p0, poly8x8_t __p1, poly8x8_t __p2) {
   6009   poly8x8_t __ret;
   6010   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6011   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6012   poly8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6013   __ret = (poly8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 4);
   6014   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6015   return __ret;
   6016 }
   6017 #endif
   6018 
   6019 #ifdef __LITTLE_ENDIAN__
   6020 __ai __attribute__((target("neon"))) poly16x4_t vbsl_p16(uint16x4_t __p0, poly16x4_t __p1, poly16x4_t __p2) {
   6021   poly16x4_t __ret;
   6022   __ret = (poly16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 5);
   6023   return __ret;
   6024 }
   6025 #else
   6026 __ai __attribute__((target("neon"))) poly16x4_t vbsl_p16(uint16x4_t __p0, poly16x4_t __p1, poly16x4_t __p2) {
   6027   poly16x4_t __ret;
   6028   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6029   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6030   poly16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6031   __ret = (poly16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 5);
   6032   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6033   return __ret;
   6034 }
   6035 #endif
   6036 
   6037 #ifdef __LITTLE_ENDIAN__
   6038 __ai __attribute__((target("neon"))) poly8x16_t vbslq_p8(uint8x16_t __p0, poly8x16_t __p1, poly8x16_t __p2) {
   6039   poly8x16_t __ret;
   6040   __ret = (poly8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 36);
   6041   return __ret;
   6042 }
   6043 #else
   6044 __ai __attribute__((target("neon"))) poly8x16_t vbslq_p8(uint8x16_t __p0, poly8x16_t __p1, poly8x16_t __p2) {
   6045   poly8x16_t __ret;
   6046   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6047   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6048   poly8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6049   __ret = (poly8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 36);
   6050   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6051   return __ret;
   6052 }
   6053 #endif
   6054 
   6055 #ifdef __LITTLE_ENDIAN__
   6056 __ai __attribute__((target("neon"))) poly16x8_t vbslq_p16(uint16x8_t __p0, poly16x8_t __p1, poly16x8_t __p2) {
   6057   poly16x8_t __ret;
   6058   __ret = (poly16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 37);
   6059   return __ret;
   6060 }
   6061 #else
   6062 __ai __attribute__((target("neon"))) poly16x8_t vbslq_p16(uint16x8_t __p0, poly16x8_t __p1, poly16x8_t __p2) {
   6063   poly16x8_t __ret;
   6064   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6065   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6066   poly16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6067   __ret = (poly16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 37);
   6068   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6069   return __ret;
   6070 }
   6071 #endif
   6072 
   6073 #ifdef __LITTLE_ENDIAN__
   6074 __ai __attribute__((target("neon"))) uint8x16_t vbslq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   6075   uint8x16_t __ret;
   6076   __ret = (uint8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48);
   6077   return __ret;
   6078 }
   6079 #else
   6080 __ai __attribute__((target("neon"))) uint8x16_t vbslq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
   6081   uint8x16_t __ret;
   6082   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6083   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6084   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6085   __ret = (uint8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48);
   6086   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6087   return __ret;
   6088 }
   6089 #endif
   6090 
   6091 #ifdef __LITTLE_ENDIAN__
   6092 __ai __attribute__((target("neon"))) uint32x4_t vbslq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
   6093   uint32x4_t __ret;
   6094   __ret = (uint32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
   6095   return __ret;
   6096 }
   6097 #else
   6098 __ai __attribute__((target("neon"))) uint32x4_t vbslq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
   6099   uint32x4_t __ret;
   6100   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6101   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6102   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6103   __ret = (uint32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
   6104   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6105   return __ret;
   6106 }
   6107 #endif
   6108 
   6109 #ifdef __LITTLE_ENDIAN__
   6110 __ai __attribute__((target("neon"))) uint64x2_t vbslq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
   6111   uint64x2_t __ret;
   6112   __ret = (uint64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
   6113   return __ret;
   6114 }
   6115 #else
   6116 __ai __attribute__((target("neon"))) uint64x2_t vbslq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
   6117   uint64x2_t __ret;
   6118   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6119   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6120   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
   6121   __ret = (uint64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
   6122   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6123   return __ret;
   6124 }
   6125 #endif
   6126 
   6127 #ifdef __LITTLE_ENDIAN__
   6128 __ai __attribute__((target("neon"))) uint16x8_t vbslq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
   6129   uint16x8_t __ret;
   6130   __ret = (uint16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49);
   6131   return __ret;
   6132 }
   6133 #else
   6134 __ai __attribute__((target("neon"))) uint16x8_t vbslq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
   6135   uint16x8_t __ret;
   6136   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6137   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6138   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6139   __ret = (uint16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49);
   6140   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6141   return __ret;
   6142 }
   6143 #endif
   6144 
   6145 #ifdef __LITTLE_ENDIAN__
   6146 __ai __attribute__((target("neon"))) int8x16_t vbslq_s8(uint8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
   6147   int8x16_t __ret;
   6148   __ret = (int8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32);
   6149   return __ret;
   6150 }
   6151 #else
   6152 __ai __attribute__((target("neon"))) int8x16_t vbslq_s8(uint8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
   6153   int8x16_t __ret;
   6154   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6155   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6156   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6157   __ret = (int8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32);
   6158   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6159   return __ret;
   6160 }
   6161 #endif
   6162 
   6163 #ifdef __LITTLE_ENDIAN__
   6164 __ai __attribute__((target("neon"))) float32x4_t vbslq_f32(uint32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
   6165   float32x4_t __ret;
   6166   __ret = (float32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
   6167   return __ret;
   6168 }
   6169 #else
   6170 __ai __attribute__((target("neon"))) float32x4_t vbslq_f32(uint32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
   6171   float32x4_t __ret;
   6172   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6173   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6174   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6175   __ret = (float32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
   6176   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6177   return __ret;
   6178 }
   6179 #endif
   6180 
   6181 #ifdef __LITTLE_ENDIAN__
   6182 __ai __attribute__((target("neon"))) int32x4_t vbslq_s32(uint32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
   6183   int32x4_t __ret;
   6184   __ret = (int32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
   6185   return __ret;
   6186 }
   6187 #else
   6188 __ai __attribute__((target("neon"))) int32x4_t vbslq_s32(uint32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
   6189   int32x4_t __ret;
   6190   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6191   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6192   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6193   __ret = (int32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
   6194   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6195   return __ret;
   6196 }
   6197 #endif
   6198 
   6199 #ifdef __LITTLE_ENDIAN__
   6200 __ai __attribute__((target("neon"))) int64x2_t vbslq_s64(uint64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
   6201   int64x2_t __ret;
   6202   __ret = (int64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35);
   6203   return __ret;
   6204 }
   6205 #else
   6206 __ai __attribute__((target("neon"))) int64x2_t vbslq_s64(uint64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
   6207   int64x2_t __ret;
   6208   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6209   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6210   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
   6211   __ret = (int64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35);
   6212   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6213   return __ret;
   6214 }
   6215 #endif
   6216 
   6217 #ifdef __LITTLE_ENDIAN__
   6218 __ai __attribute__((target("neon"))) int16x8_t vbslq_s16(uint16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
   6219   int16x8_t __ret;
   6220   __ret = (int16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
   6221   return __ret;
   6222 }
   6223 #else
   6224 __ai __attribute__((target("neon"))) int16x8_t vbslq_s16(uint16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
   6225   int16x8_t __ret;
   6226   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6227   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6228   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6229   __ret = (int16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33);
   6230   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6231   return __ret;
   6232 }
   6233 #endif
   6234 
   6235 #ifdef __LITTLE_ENDIAN__
   6236 __ai __attribute__((target("neon"))) uint8x8_t vbsl_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
   6237   uint8x8_t __ret;
   6238   __ret = (uint8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 16);
   6239   return __ret;
   6240 }
   6241 #else
   6242 __ai __attribute__((target("neon"))) uint8x8_t vbsl_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
   6243   uint8x8_t __ret;
   6244   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6245   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6246   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6247   __ret = (uint8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 16);
   6248   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6249   return __ret;
   6250 }
   6251 #endif
   6252 
   6253 #ifdef __LITTLE_ENDIAN__
   6254 __ai __attribute__((target("neon"))) uint32x2_t vbsl_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
   6255   uint32x2_t __ret;
   6256   __ret = (uint32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18);
   6257   return __ret;
   6258 }
   6259 #else
   6260 __ai __attribute__((target("neon"))) uint32x2_t vbsl_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
   6261   uint32x2_t __ret;
   6262   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6263   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6264   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
   6265   __ret = (uint32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 18);
   6266   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6267   return __ret;
   6268 }
   6269 #endif
   6270 
   6271 __ai __attribute__((target("neon"))) uint64x1_t vbsl_u64(uint64x1_t __p0, uint64x1_t __p1, uint64x1_t __p2) {
          /* vbsl_u64: casts __p0, __p1 and __p2 to int8x8_t, passes them with the
           * constant 19 to __builtin_neon_vbsl_v, and casts the result to
           * uint64x1_t. Unlike the neighbouring vbsl_* definitions there is only
           * this one version, with no lane reversal.
           * NOTE(review): presumably NEON bitwise select with __p0 as the mask,
           * and 19 presumably tags the vector type for the builtin -- confirm. */
   6272   uint64x1_t __ret;
   6273   __ret = (uint64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 19);
   6274   return __ret;
   6275 }
   6276 #ifdef __LITTLE_ENDIAN__
        /* vbsl_u16, used when __LITTLE_ENDIAN__ is defined: casts __p0, __p1 and
         * __p2 to int8x8_t, passes them with the constant 17 to
         * __builtin_neon_vbsl_v, and casts the result to uint16x4_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 17 presumably tags the vector type for the builtin -- confirm. */
   6277 __ai __attribute__((target("neon"))) uint16x4_t vbsl_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
   6278   uint16x4_t __ret;
   6279   __ret = (uint16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 17);
   6280   return __ret;
   6281 }
   6282 #else
        /* vbsl_u16, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6283 __ai __attribute__((target("neon"))) uint16x4_t vbsl_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
   6284   uint16x4_t __ret;
   6285   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6286   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6287   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6288   __ret = (uint16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 17);
   6289   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6290   return __ret;
   6291 }
   6292 #endif
   6293 
   6294 #ifdef __LITTLE_ENDIAN__
        /* vbsl_s8, used when __LITTLE_ENDIAN__ is defined: casts the uint8x8_t
         * operand __p0 and the int8x8_t operands __p1 and __p2 to int8x8_t, passes
         * them with the constant 0 to __builtin_neon_vbsl_v, and casts the result
         * to int8x8_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 0 presumably tags the vector type for the builtin -- confirm. */
   6295 __ai __attribute__((target("neon"))) int8x8_t vbsl_s8(uint8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
   6296   int8x8_t __ret;
   6297   __ret = (int8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 0);
   6298   return __ret;
   6299 }
   6300 #else
        /* vbsl_s8, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6301 __ai __attribute__((target("neon"))) int8x8_t vbsl_s8(uint8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
   6302   int8x8_t __ret;
   6303   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6304   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6305   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6306   __ret = (int8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 0);
   6307   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6308   return __ret;
   6309 }
   6310 #endif
   6311 
   6312 #ifdef __LITTLE_ENDIAN__
        /* vbsl_f32, used when __LITTLE_ENDIAN__ is defined: casts the uint32x2_t
         * operand __p0 and the float32x2_t operands __p1 and __p2 to int8x8_t,
         * passes them with the constant 9 to __builtin_neon_vbsl_v, and casts the
         * result to float32x2_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 9 presumably tags the vector type for the builtin -- confirm. */
   6313 __ai __attribute__((target("neon"))) float32x2_t vbsl_f32(uint32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
   6314   float32x2_t __ret;
   6315   __ret = (float32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
   6316   return __ret;
   6317 }
   6318 #else
        /* vbsl_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6319 __ai __attribute__((target("neon"))) float32x2_t vbsl_f32(uint32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
   6320   float32x2_t __ret;
   6321   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6322   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6323   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
   6324   __ret = (float32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
   6325   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6326   return __ret;
   6327 }
   6328 #endif
   6329 
   6330 #ifdef __LITTLE_ENDIAN__
        /* vbsl_s32, used when __LITTLE_ENDIAN__ is defined: casts the uint32x2_t
         * operand __p0 and the int32x2_t operands __p1 and __p2 to int8x8_t,
         * passes them with the constant 2 to __builtin_neon_vbsl_v, and casts the
         * result to int32x2_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 2 presumably tags the vector type for the builtin -- confirm. */
   6331 __ai __attribute__((target("neon"))) int32x2_t vbsl_s32(uint32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
   6332   int32x2_t __ret;
   6333   __ret = (int32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
   6334   return __ret;
   6335 }
   6336 #else
        /* vbsl_s32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6337 __ai __attribute__((target("neon"))) int32x2_t vbsl_s32(uint32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
   6338   int32x2_t __ret;
   6339   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6340   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6341   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
   6342   __ret = (int32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2);
   6343   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6344   return __ret;
   6345 }
   6346 #endif
   6347 
   6348 __ai __attribute__((target("neon"))) int64x1_t vbsl_s64(uint64x1_t __p0, int64x1_t __p1, int64x1_t __p2) {
          /* vbsl_s64: casts the uint64x1_t operand __p0 and the int64x1_t operands
           * __p1 and __p2 to int8x8_t, passes them with the constant 3 to
           * __builtin_neon_vbsl_v, and casts the result to int64x1_t. Unlike the
           * neighbouring vbsl_* definitions there is only this one version, with
           * no lane reversal.
           * NOTE(review): presumably NEON bitwise select with __p0 as the mask,
           * and 3 presumably tags the vector type for the builtin -- confirm. */
   6349   int64x1_t __ret;
   6350   __ret = (int64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 3);
   6351   return __ret;
   6352 }
   6353 #ifdef __LITTLE_ENDIAN__
        /* vbsl_s16, used when __LITTLE_ENDIAN__ is defined: casts the uint16x4_t
         * operand __p0 and the int16x4_t operands __p1 and __p2 to int8x8_t,
         * passes them with the constant 1 to __builtin_neon_vbsl_v, and casts the
         * result to int16x4_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 1 presumably tags the vector type for the builtin -- confirm. */
   6354 __ai __attribute__((target("neon"))) int16x4_t vbsl_s16(uint16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
   6355   int16x4_t __ret;
   6356   __ret = (int16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1);
   6357   return __ret;
   6358 }
   6359 #else
        /* vbsl_s16, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6360 __ai __attribute__((target("neon"))) int16x4_t vbsl_s16(uint16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
   6361   int16x4_t __ret;
   6362   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6363   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6364   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6365   __ret = (int16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1);
   6366   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6367   return __ret;
   6368 }
   6369 #endif
   6370 
   6371 #ifdef __LITTLE_ENDIAN__
        /* vbslq_f16, used when __LITTLE_ENDIAN__ is defined: casts the uint16x8_t
         * operand __p0 and the float16x8_t operands __p1 and __p2 to int8x16_t,
         * passes them with the constant 40 to __builtin_neon_vbslq_v, and casts
         * the result to float16x8_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 40 presumably tags the vector type for the builtin -- confirm. */
   6372 __ai __attribute__((target("neon"))) float16x8_t vbslq_f16(uint16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   6373   float16x8_t __ret;
   6374   __ret = (float16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
   6375   return __ret;
   6376 }
   6377 #else
        /* vbslq_f16, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6378 __ai __attribute__((target("neon"))) float16x8_t vbslq_f16(uint16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
   6379   float16x8_t __ret;
   6380   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6381   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6382   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
   6383   __ret = (float16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
   6384   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6385   return __ret;
   6386 }
   6387 #endif
   6388 
   6389 #ifdef __LITTLE_ENDIAN__
        /* vbsl_f16, used when __LITTLE_ENDIAN__ is defined: casts the uint16x4_t
         * operand __p0 and the float16x4_t operands __p1 and __p2 to int8x8_t,
         * passes them with the constant 8 to __builtin_neon_vbsl_v, and casts the
         * result to float16x4_t.
         * NOTE(review): presumably NEON bitwise select with __p0 as the mask, and
         * 8 presumably tags the vector type for the builtin -- confirm. */
   6390 __ai __attribute__((target("neon"))) float16x4_t vbsl_f16(uint16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   6391   float16x4_t __ret;
   6392   __ret = (float16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
   6393   return __ret;
   6394 }
   6395 #else
        /* vbsl_f16, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of the operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6396 __ai __attribute__((target("neon"))) float16x4_t vbsl_f16(uint16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
   6397   float16x4_t __ret;
   6398   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6399   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6400   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
   6401   __ret = (float16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
   6402   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6403   return __ret;
   6404 }
   6405 #endif
   6406 
   6407 #ifdef __LITTLE_ENDIAN__
        /* vcageq_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x16_t, passes them with the constant 50 to
         * __builtin_neon_vcageq_v, and casts the result to uint32x4_t.
         * NOTE(review): presumably the absolute-value compare |__p0| >= |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6408 __ai __attribute__((target("neon"))) uint32x4_t vcageq_f32(float32x4_t __p0, float32x4_t __p1) {
   6409   uint32x4_t __ret;
   6410   __ret = (uint32x4_t) __builtin_neon_vcageq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   6411   return __ret;
   6412 }
   6413 #else
        /* vcageq_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6414 __ai __attribute__((target("neon"))) uint32x4_t vcageq_f32(float32x4_t __p0, float32x4_t __p1) {
   6415   uint32x4_t __ret;
   6416   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6417   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6418   __ret = (uint32x4_t) __builtin_neon_vcageq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
   6419   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6420   return __ret;
   6421 }
   6422 #endif
   6423 
   6424 #ifdef __LITTLE_ENDIAN__
        /* vcage_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x8_t, passes them with the constant 18 to
         * __builtin_neon_vcage_v, and casts the result to uint32x2_t.
         * NOTE(review): presumably the absolute-value compare |__p0| >= |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6425 __ai __attribute__((target("neon"))) uint32x2_t vcage_f32(float32x2_t __p0, float32x2_t __p1) {
   6426   uint32x2_t __ret;
   6427   __ret = (uint32x2_t) __builtin_neon_vcage_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   6428   return __ret;
   6429 }
   6430 #else
        /* vcage_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6431 __ai __attribute__((target("neon"))) uint32x2_t vcage_f32(float32x2_t __p0, float32x2_t __p1) {
   6432   uint32x2_t __ret;
   6433   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6434   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6435   __ret = (uint32x2_t) __builtin_neon_vcage_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
   6436   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6437   return __ret;
   6438 }
   6439 #endif
   6440 
   6441 #ifdef __LITTLE_ENDIAN__
        /* vcagtq_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x16_t, passes them with the constant 50 to
         * __builtin_neon_vcagtq_v, and casts the result to uint32x4_t.
         * NOTE(review): presumably the absolute-value compare |__p0| > |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6442 __ai __attribute__((target("neon"))) uint32x4_t vcagtq_f32(float32x4_t __p0, float32x4_t __p1) {
   6443   uint32x4_t __ret;
   6444   __ret = (uint32x4_t) __builtin_neon_vcagtq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   6445   return __ret;
   6446 }
   6447 #else
        /* vcagtq_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6448 __ai __attribute__((target("neon"))) uint32x4_t vcagtq_f32(float32x4_t __p0, float32x4_t __p1) {
   6449   uint32x4_t __ret;
   6450   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6451   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6452   __ret = (uint32x4_t) __builtin_neon_vcagtq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
   6453   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6454   return __ret;
   6455 }
   6456 #endif
   6457 
   6458 #ifdef __LITTLE_ENDIAN__
        /* vcagt_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x8_t, passes them with the constant 18 to
         * __builtin_neon_vcagt_v, and casts the result to uint32x2_t.
         * NOTE(review): presumably the absolute-value compare |__p0| > |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6459 __ai __attribute__((target("neon"))) uint32x2_t vcagt_f32(float32x2_t __p0, float32x2_t __p1) {
   6460   uint32x2_t __ret;
   6461   __ret = (uint32x2_t) __builtin_neon_vcagt_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   6462   return __ret;
   6463 }
   6464 #else
        /* vcagt_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6465 __ai __attribute__((target("neon"))) uint32x2_t vcagt_f32(float32x2_t __p0, float32x2_t __p1) {
   6466   uint32x2_t __ret;
   6467   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6468   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6469   __ret = (uint32x2_t) __builtin_neon_vcagt_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
   6470   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6471   return __ret;
   6472 }
   6473 #endif
   6474 
   6475 #ifdef __LITTLE_ENDIAN__
        /* vcaleq_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x16_t, passes them with the constant 50 to
         * __builtin_neon_vcaleq_v, and casts the result to uint32x4_t.
         * NOTE(review): presumably the absolute-value compare |__p0| <= |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6476 __ai __attribute__((target("neon"))) uint32x4_t vcaleq_f32(float32x4_t __p0, float32x4_t __p1) {
   6477   uint32x4_t __ret;
   6478   __ret = (uint32x4_t) __builtin_neon_vcaleq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   6479   return __ret;
   6480 }
   6481 #else
        /* vcaleq_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6482 __ai __attribute__((target("neon"))) uint32x4_t vcaleq_f32(float32x4_t __p0, float32x4_t __p1) {
   6483   uint32x4_t __ret;
   6484   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6485   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6486   __ret = (uint32x4_t) __builtin_neon_vcaleq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
   6487   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6488   return __ret;
   6489 }
   6490 #endif
   6491 
   6492 #ifdef __LITTLE_ENDIAN__
        /* vcale_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x8_t, passes them with the constant 18 to
         * __builtin_neon_vcale_v, and casts the result to uint32x2_t.
         * NOTE(review): presumably the absolute-value compare |__p0| <= |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6493 __ai __attribute__((target("neon"))) uint32x2_t vcale_f32(float32x2_t __p0, float32x2_t __p1) {
   6494   uint32x2_t __ret;
   6495   __ret = (uint32x2_t) __builtin_neon_vcale_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   6496   return __ret;
   6497 }
   6498 #else
        /* vcale_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6499 __ai __attribute__((target("neon"))) uint32x2_t vcale_f32(float32x2_t __p0, float32x2_t __p1) {
   6500   uint32x2_t __ret;
   6501   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6502   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6503   __ret = (uint32x2_t) __builtin_neon_vcale_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
   6504   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6505   return __ret;
   6506 }
   6507 #endif
   6508 
   6509 #ifdef __LITTLE_ENDIAN__
        /* vcaltq_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x16_t, passes them with the constant 50 to
         * __builtin_neon_vcaltq_v, and casts the result to uint32x4_t.
         * NOTE(review): presumably the absolute-value compare |__p0| < |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6510 __ai __attribute__((target("neon"))) uint32x4_t vcaltq_f32(float32x4_t __p0, float32x4_t __p1) {
   6511   uint32x4_t __ret;
   6512   __ret = (uint32x4_t) __builtin_neon_vcaltq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
   6513   return __ret;
   6514 }
   6515 #else
        /* vcaltq_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6516 __ai __attribute__((target("neon"))) uint32x4_t vcaltq_f32(float32x4_t __p0, float32x4_t __p1) {
   6517   uint32x4_t __ret;
   6518   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6519   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6520   __ret = (uint32x4_t) __builtin_neon_vcaltq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
   6521   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6522   return __ret;
   6523 }
   6524 #endif
   6525 
   6526 #ifdef __LITTLE_ENDIAN__
        /* vcalt_f32, used when __LITTLE_ENDIAN__ is defined: casts __p0 and __p1
         * to int8x8_t, passes them with the constant 18 to
         * __builtin_neon_vcalt_v, and casts the result to uint32x2_t.
         * NOTE(review): presumably the absolute-value compare |__p0| < |__p1|
         * yielding a per-lane mask -- confirm against the Arm intrinsics docs. */
   6527 __ai __attribute__((target("neon"))) uint32x2_t vcalt_f32(float32x2_t __p0, float32x2_t __p1) {
   6528   uint32x2_t __ret;
   6529   __ret = (uint32x2_t) __builtin_neon_vcalt_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
   6530   return __ret;
   6531 }
   6532 #else
        /* vcalt_f32, used otherwise (presumably big-endian targets): makes
         * lane-reversed copies of both operands with __builtin_shufflevector, runs
         * the same builtin call on them, and reverses the result's lanes before
         * returning. */
   6533 __ai __attribute__((target("neon"))) uint32x2_t vcalt_f32(float32x2_t __p0, float32x2_t __p1) {
   6534   uint32x2_t __ret;
   6535   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6536   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6537   __ret = (uint32x2_t) __builtin_neon_vcalt_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
   6538   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6539   return __ret;
   6540 }
   6541 #endif
   6542 
   6543 #ifdef __LITTLE_ENDIAN__
        /* vceq_p8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x8_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6544 __ai __attribute__((target("neon"))) uint8x8_t vceq_p8(poly8x8_t __p0, poly8x8_t __p1) {
   6545   uint8x8_t __ret;
   6546   __ret = (uint8x8_t)(__p0 == __p1);
   6547   return __ret;
   6548 }
   6549 #else
        /* vceq_p8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6550 __ai __attribute__((target("neon"))) uint8x8_t vceq_p8(poly8x8_t __p0, poly8x8_t __p1) {
   6551   uint8x8_t __ret;
   6552   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6553   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6554   __ret = (uint8x8_t)(__rev0 == __rev1);
   6555   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6556   return __ret;
   6557 }
   6558 #endif
   6559 
   6560 #ifdef __LITTLE_ENDIAN__
        /* vceqq_p8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x16_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6561 __ai __attribute__((target("neon"))) uint8x16_t vceqq_p8(poly8x16_t __p0, poly8x16_t __p1) {
   6562   uint8x16_t __ret;
   6563   __ret = (uint8x16_t)(__p0 == __p1);
   6564   return __ret;
   6565 }
   6566 #else
        /* vceqq_p8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6567 __ai __attribute__((target("neon"))) uint8x16_t vceqq_p8(poly8x16_t __p0, poly8x16_t __p1) {
   6568   uint8x16_t __ret;
   6569   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6570   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6571   __ret = (uint8x16_t)(__rev0 == __rev1);
   6572   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6573   return __ret;
   6574 }
   6575 #endif
   6576 
   6577 #ifdef __LITTLE_ENDIAN__
        /* vceqq_u8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x16_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6578 __ai __attribute__((target("neon"))) uint8x16_t vceqq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   6579   uint8x16_t __ret;
   6580   __ret = (uint8x16_t)(__p0 == __p1);
   6581   return __ret;
   6582 }
   6583 #else
        /* vceqq_u8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6584 __ai __attribute__((target("neon"))) uint8x16_t vceqq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   6585   uint8x16_t __ret;
   6586   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6587   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6588   __ret = (uint8x16_t)(__rev0 == __rev1);
   6589   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6590   return __ret;
   6591 }
   6592 #endif
   6593 
   6594 #ifdef __LITTLE_ENDIAN__
        /* vceqq_u32, used when __LITTLE_ENDIAN__ is defined: compares __p0 and
         * __p1 lane by lane with the vector `==` operator and casts the outcome to
         * uint32x4_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6595 __ai __attribute__((target("neon"))) uint32x4_t vceqq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   6596   uint32x4_t __ret;
   6597   __ret = (uint32x4_t)(__p0 == __p1);
   6598   return __ret;
   6599 }
   6600 #else
        /* vceqq_u32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6601 __ai __attribute__((target("neon"))) uint32x4_t vceqq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   6602   uint32x4_t __ret;
   6603   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6604   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6605   __ret = (uint32x4_t)(__rev0 == __rev1);
   6606   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6607   return __ret;
   6608 }
   6609 #endif
   6610 
   6611 #ifdef __LITTLE_ENDIAN__
        /* vceqq_u16, used when __LITTLE_ENDIAN__ is defined: compares __p0 and
         * __p1 lane by lane with the vector `==` operator and casts the outcome to
         * uint16x8_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6612 __ai __attribute__((target("neon"))) uint16x8_t vceqq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   6613   uint16x8_t __ret;
   6614   __ret = (uint16x8_t)(__p0 == __p1);
   6615   return __ret;
   6616 }
   6617 #else
        /* vceqq_u16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6618 __ai __attribute__((target("neon"))) uint16x8_t vceqq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   6619   uint16x8_t __ret;
   6620   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6621   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6622   __ret = (uint16x8_t)(__rev0 == __rev1);
   6623   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6624   return __ret;
   6625 }
   6626 #endif
   6627 
   6628 #ifdef __LITTLE_ENDIAN__
        /* vceqq_s8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x16_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6629 __ai __attribute__((target("neon"))) uint8x16_t vceqq_s8(int8x16_t __p0, int8x16_t __p1) {
   6630   uint8x16_t __ret;
   6631   __ret = (uint8x16_t)(__p0 == __p1);
   6632   return __ret;
   6633 }
   6634 #else
        /* vceqq_s8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6635 __ai __attribute__((target("neon"))) uint8x16_t vceqq_s8(int8x16_t __p0, int8x16_t __p1) {
   6636   uint8x16_t __ret;
   6637   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6638   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6639   __ret = (uint8x16_t)(__rev0 == __rev1);
   6640   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6641   return __ret;
   6642 }
   6643 #endif
   6644 
   6645 #ifdef __LITTLE_ENDIAN__
        /* vceqq_f32, used when __LITTLE_ENDIAN__ is defined: compares the float
         * lanes of __p0 and __p1 with the vector `==` operator and casts the
         * outcome to uint32x4_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6646 __ai __attribute__((target("neon"))) uint32x4_t vceqq_f32(float32x4_t __p0, float32x4_t __p1) {
   6647   uint32x4_t __ret;
   6648   __ret = (uint32x4_t)(__p0 == __p1);
   6649   return __ret;
   6650 }
   6651 #else
        /* vceqq_f32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6652 __ai __attribute__((target("neon"))) uint32x4_t vceqq_f32(float32x4_t __p0, float32x4_t __p1) {
   6653   uint32x4_t __ret;
   6654   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6655   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6656   __ret = (uint32x4_t)(__rev0 == __rev1);
   6657   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6658   return __ret;
   6659 }
   6660 #endif
   6661 
   6662 #ifdef __LITTLE_ENDIAN__
        /* vceqq_s32, used when __LITTLE_ENDIAN__ is defined: compares __p0 and
         * __p1 lane by lane with the vector `==` operator and casts the outcome to
         * uint32x4_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6663 __ai __attribute__((target("neon"))) uint32x4_t vceqq_s32(int32x4_t __p0, int32x4_t __p1) {
   6664   uint32x4_t __ret;
   6665   __ret = (uint32x4_t)(__p0 == __p1);
   6666   return __ret;
   6667 }
   6668 #else
        /* vceqq_s32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6669 __ai __attribute__((target("neon"))) uint32x4_t vceqq_s32(int32x4_t __p0, int32x4_t __p1) {
   6670   uint32x4_t __ret;
   6671   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6672   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6673   __ret = (uint32x4_t)(__rev0 == __rev1);
   6674   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6675   return __ret;
   6676 }
   6677 #endif
   6678 
   6679 #ifdef __LITTLE_ENDIAN__
        /* vceqq_s16, used when __LITTLE_ENDIAN__ is defined: compares __p0 and
         * __p1 lane by lane with the vector `==` operator and casts the outcome to
         * uint16x8_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6680 __ai __attribute__((target("neon"))) uint16x8_t vceqq_s16(int16x8_t __p0, int16x8_t __p1) {
   6681   uint16x8_t __ret;
   6682   __ret = (uint16x8_t)(__p0 == __p1);
   6683   return __ret;
   6684 }
   6685 #else
        /* vceqq_s16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6686 __ai __attribute__((target("neon"))) uint16x8_t vceqq_s16(int16x8_t __p0, int16x8_t __p1) {
   6687   uint16x8_t __ret;
   6688   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6689   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6690   __ret = (uint16x8_t)(__rev0 == __rev1);
   6691   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6692   return __ret;
   6693 }
   6694 #endif
   6695 
   6696 #ifdef __LITTLE_ENDIAN__
        /* vceq_u8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x8_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6697 __ai __attribute__((target("neon"))) uint8x8_t vceq_u8(uint8x8_t __p0, uint8x8_t __p1) {
   6698   uint8x8_t __ret;
   6699   __ret = (uint8x8_t)(__p0 == __p1);
   6700   return __ret;
   6701 }
   6702 #else
        /* vceq_u8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6703 __ai __attribute__((target("neon"))) uint8x8_t vceq_u8(uint8x8_t __p0, uint8x8_t __p1) {
   6704   uint8x8_t __ret;
   6705   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6706   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6707   __ret = (uint8x8_t)(__rev0 == __rev1);
   6708   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6709   return __ret;
   6710 }
   6711 #endif
   6712 
   6713 #ifdef __LITTLE_ENDIAN__
        /* vceq_u32, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint32x2_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6714 __ai __attribute__((target("neon"))) uint32x2_t vceq_u32(uint32x2_t __p0, uint32x2_t __p1) {
   6715   uint32x2_t __ret;
   6716   __ret = (uint32x2_t)(__p0 == __p1);
   6717   return __ret;
   6718 }
   6719 #else
        /* vceq_u32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6720 __ai __attribute__((target("neon"))) uint32x2_t vceq_u32(uint32x2_t __p0, uint32x2_t __p1) {
   6721   uint32x2_t __ret;
   6722   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6723   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6724   __ret = (uint32x2_t)(__rev0 == __rev1);
   6725   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6726   return __ret;
   6727 }
   6728 #endif
   6729 
   6730 #ifdef __LITTLE_ENDIAN__
        /* vceq_u16, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint16x4_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6731 __ai __attribute__((target("neon"))) uint16x4_t vceq_u16(uint16x4_t __p0, uint16x4_t __p1) {
   6732   uint16x4_t __ret;
   6733   __ret = (uint16x4_t)(__p0 == __p1);
   6734   return __ret;
   6735 }
   6736 #else
        /* vceq_u16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6737 __ai __attribute__((target("neon"))) uint16x4_t vceq_u16(uint16x4_t __p0, uint16x4_t __p1) {
   6738   uint16x4_t __ret;
   6739   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6740   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6741   __ret = (uint16x4_t)(__rev0 == __rev1);
   6742   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6743   return __ret;
   6744 }
   6745 #endif
   6746 
   6747 #ifdef __LITTLE_ENDIAN__
        /* vceq_s8, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint8x8_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6748 __ai __attribute__((target("neon"))) uint8x8_t vceq_s8(int8x8_t __p0, int8x8_t __p1) {
   6749   uint8x8_t __ret;
   6750   __ret = (uint8x8_t)(__p0 == __p1);
   6751   return __ret;
   6752 }
   6753 #else
        /* vceq_s8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6754 __ai __attribute__((target("neon"))) uint8x8_t vceq_s8(int8x8_t __p0, int8x8_t __p1) {
   6755   uint8x8_t __ret;
   6756   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6757   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6758   __ret = (uint8x8_t)(__rev0 == __rev1);
   6759   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6760   return __ret;
   6761 }
   6762 #endif
   6763 
   6764 #ifdef __LITTLE_ENDIAN__
        /* vceq_f32, used when __LITTLE_ENDIAN__ is defined: compares the float
         * lanes of __p0 and __p1 with the vector `==` operator and casts the
         * outcome to uint32x2_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6765 __ai __attribute__((target("neon"))) uint32x2_t vceq_f32(float32x2_t __p0, float32x2_t __p1) {
   6766   uint32x2_t __ret;
   6767   __ret = (uint32x2_t)(__p0 == __p1);
   6768   return __ret;
   6769 }
   6770 #else
        /* vceq_f32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6771 __ai __attribute__((target("neon"))) uint32x2_t vceq_f32(float32x2_t __p0, float32x2_t __p1) {
   6772   uint32x2_t __ret;
   6773   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6774   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6775   __ret = (uint32x2_t)(__rev0 == __rev1);
   6776   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6777   return __ret;
   6778 }
   6779 #endif
   6780 
   6781 #ifdef __LITTLE_ENDIAN__
        /* vceq_s32, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint32x2_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6782 __ai __attribute__((target("neon"))) uint32x2_t vceq_s32(int32x2_t __p0, int32x2_t __p1) {
   6783   uint32x2_t __ret;
   6784   __ret = (uint32x2_t)(__p0 == __p1);
   6785   return __ret;
   6786 }
   6787 #else
        /* vceq_s32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6788 __ai __attribute__((target("neon"))) uint32x2_t vceq_s32(int32x2_t __p0, int32x2_t __p1) {
   6789   uint32x2_t __ret;
   6790   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6791   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6792   __ret = (uint32x2_t)(__rev0 == __rev1);
   6793   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6794   return __ret;
   6795 }
   6796 #endif
   6797 
   6798 #ifdef __LITTLE_ENDIAN__
        /* vceq_s16, used when __LITTLE_ENDIAN__ is defined: compares __p0 and __p1
         * lane by lane with the vector `==` operator and casts the outcome to
         * uint16x4_t (under Clang's vector rules a true lane is all ones, a false
         * lane is 0). */
   6799 __ai __attribute__((target("neon"))) uint16x4_t vceq_s16(int16x4_t __p0, int16x4_t __p1) {
   6800   uint16x4_t __ret;
   6801   __ret = (uint16x4_t)(__p0 == __p1);
   6802   return __ret;
   6803 }
   6804 #else
        /* vceq_s16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `==` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6805 __ai __attribute__((target("neon"))) uint16x4_t vceq_s16(int16x4_t __p0, int16x4_t __p1) {
   6806   uint16x4_t __ret;
   6807   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6808   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6809   __ret = (uint16x4_t)(__rev0 == __rev1);
   6810   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6811   return __ret;
   6812 }
   6813 #endif
   6814 
   6815 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_u8, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint8x16_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6816 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   6817   uint8x16_t __ret;
   6818   __ret = (uint8x16_t)(__p0 >= __p1);
   6819   return __ret;
   6820 }
   6821 #else
        /* vcgeq_u8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6822 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   6823   uint8x16_t __ret;
   6824   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6825   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6826   __ret = (uint8x16_t)(__rev0 >= __rev1);
   6827   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6828   return __ret;
   6829 }
   6830 #endif
   6831 
   6832 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_u32, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint32x4_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6833 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   6834   uint32x4_t __ret;
   6835   __ret = (uint32x4_t)(__p0 >= __p1);
   6836   return __ret;
   6837 }
   6838 #else
        /* vcgeq_u32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6839 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   6840   uint32x4_t __ret;
   6841   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6842   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6843   __ret = (uint32x4_t)(__rev0 >= __rev1);
   6844   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6845   return __ret;
   6846 }
   6847 #endif
   6848 
   6849 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_u16, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint16x8_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6850 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   6851   uint16x8_t __ret;
   6852   __ret = (uint16x8_t)(__p0 >= __p1);
   6853   return __ret;
   6854 }
   6855 #else
        /* vcgeq_u16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6856 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   6857   uint16x8_t __ret;
   6858   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6859   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6860   __ret = (uint16x8_t)(__rev0 >= __rev1);
   6861   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6862   return __ret;
   6863 }
   6864 #endif
   6865 
   6866 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_s8, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint8x16_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6867 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_s8(int8x16_t __p0, int8x16_t __p1) {
   6868   uint8x16_t __ret;
   6869   __ret = (uint8x16_t)(__p0 >= __p1);
   6870   return __ret;
   6871 }
   6872 #else
        /* vcgeq_s8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6873 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_s8(int8x16_t __p0, int8x16_t __p1) {
   6874   uint8x16_t __ret;
   6875   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6876   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6877   __ret = (uint8x16_t)(__rev0 >= __rev1);
   6878   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   6879   return __ret;
   6880 }
   6881 #endif
   6882 
   6883 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_f32, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 on the float lanes with the vector `>=` operator and casts
         * the outcome to uint32x4_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6884 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_f32(float32x4_t __p0, float32x4_t __p1) {
   6885   uint32x4_t __ret;
   6886   __ret = (uint32x4_t)(__p0 >= __p1);
   6887   return __ret;
   6888 }
   6889 #else
        /* vcgeq_f32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6890 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_f32(float32x4_t __p0, float32x4_t __p1) {
   6891   uint32x4_t __ret;
   6892   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6893   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6894   __ret = (uint32x4_t)(__rev0 >= __rev1);
   6895   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6896   return __ret;
   6897 }
   6898 #endif
   6899 
   6900 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_s32, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint32x4_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6901 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_s32(int32x4_t __p0, int32x4_t __p1) {
   6902   uint32x4_t __ret;
   6903   __ret = (uint32x4_t)(__p0 >= __p1);
   6904   return __ret;
   6905 }
   6906 #else
        /* vcgeq_s32, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6907 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_s32(int32x4_t __p0, int32x4_t __p1) {
   6908   uint32x4_t __ret;
   6909   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6910   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6911   __ret = (uint32x4_t)(__rev0 >= __rev1);
   6912   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6913   return __ret;
   6914 }
   6915 #endif
   6916 
   6917 #ifdef __LITTLE_ENDIAN__
        /* vcgeq_s16, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint16x8_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6918 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_s16(int16x8_t __p0, int16x8_t __p1) {
   6919   uint16x8_t __ret;
   6920   __ret = (uint16x8_t)(__p0 >= __p1);
   6921   return __ret;
   6922 }
   6923 #else
        /* vcgeq_s16, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6924 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_s16(int16x8_t __p0, int16x8_t __p1) {
   6925   uint16x8_t __ret;
   6926   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6927   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6928   __ret = (uint16x8_t)(__rev0 >= __rev1);
   6929   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6930   return __ret;
   6931 }
   6932 #endif
   6933 
   6934 #ifdef __LITTLE_ENDIAN__
        /* vcge_u8, used when __LITTLE_ENDIAN__ is defined: evaluates
         * __p0 >= __p1 lane by lane with the vector `>=` operator and casts the
         * outcome to uint8x8_t (under Clang's vector rules a true lane is all
         * ones, a false lane is 0). */
   6935 __ai __attribute__((target("neon"))) uint8x8_t vcge_u8(uint8x8_t __p0, uint8x8_t __p1) {
   6936   uint8x8_t __ret;
   6937   __ret = (uint8x8_t)(__p0 >= __p1);
   6938   return __ret;
   6939 }
   6940 #else
        /* vcge_u8, used otherwise (presumably big-endian targets): reverses the
         * lanes of both operands, applies `>=` to the reversed copies, and
         * reverses the result's lanes before returning. */
   6941 __ai __attribute__((target("neon"))) uint8x8_t vcge_u8(uint8x8_t __p0, uint8x8_t __p1) {
   6942   uint8x8_t __ret;
   6943   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6944   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6945   __ret = (uint8x8_t)(__rev0 >= __rev1);
   6946   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6947   return __ret;
   6948 }
   6949 #endif
   6950 
   6951 #ifdef __LITTLE_ENDIAN__
   6952 __ai __attribute__((target("neon"))) uint32x2_t vcge_u32(uint32x2_t __p0, uint32x2_t __p1) {
   6953   uint32x2_t __ret;
   6954   __ret = (uint32x2_t)(__p0 >= __p1);
   6955   return __ret;
   6956 }
   6957 #else
   6958 __ai __attribute__((target("neon"))) uint32x2_t vcge_u32(uint32x2_t __p0, uint32x2_t __p1) {
   6959   uint32x2_t __ret;
   6960   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   6961   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   6962   __ret = (uint32x2_t)(__rev0 >= __rev1);
   6963   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   6964   return __ret;
   6965 }
   6966 #endif
   6967 
   6968 #ifdef __LITTLE_ENDIAN__
   6969 __ai __attribute__((target("neon"))) uint16x4_t vcge_u16(uint16x4_t __p0, uint16x4_t __p1) {
   6970   uint16x4_t __ret;
   6971   __ret = (uint16x4_t)(__p0 >= __p1);
   6972   return __ret;
   6973 }
   6974 #else
   6975 __ai __attribute__((target("neon"))) uint16x4_t vcge_u16(uint16x4_t __p0, uint16x4_t __p1) {
   6976   uint16x4_t __ret;
   6977   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   6978   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   6979   __ret = (uint16x4_t)(__rev0 >= __rev1);
   6980   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   6981   return __ret;
   6982 }
   6983 #endif
   6984 
   6985 #ifdef __LITTLE_ENDIAN__
   6986 __ai __attribute__((target("neon"))) uint8x8_t vcge_s8(int8x8_t __p0, int8x8_t __p1) {
   6987   uint8x8_t __ret;
   6988   __ret = (uint8x8_t)(__p0 >= __p1);
   6989   return __ret;
   6990 }
   6991 #else
   6992 __ai __attribute__((target("neon"))) uint8x8_t vcge_s8(int8x8_t __p0, int8x8_t __p1) {
   6993   uint8x8_t __ret;
   6994   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   6995   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   6996   __ret = (uint8x8_t)(__rev0 >= __rev1);
   6997   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   6998   return __ret;
   6999 }
   7000 #endif
   7001 
   7002 #ifdef __LITTLE_ENDIAN__
   7003 __ai __attribute__((target("neon"))) uint32x2_t vcge_f32(float32x2_t __p0, float32x2_t __p1) {
   7004   uint32x2_t __ret;
   7005   __ret = (uint32x2_t)(__p0 >= __p1);
   7006   return __ret;
   7007 }
   7008 #else
   7009 __ai __attribute__((target("neon"))) uint32x2_t vcge_f32(float32x2_t __p0, float32x2_t __p1) {
   7010   uint32x2_t __ret;
   7011   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7012   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7013   __ret = (uint32x2_t)(__rev0 >= __rev1);
   7014   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7015   return __ret;
   7016 }
   7017 #endif
   7018 
   7019 #ifdef __LITTLE_ENDIAN__
   7020 __ai __attribute__((target("neon"))) uint32x2_t vcge_s32(int32x2_t __p0, int32x2_t __p1) {
   7021   uint32x2_t __ret;
   7022   __ret = (uint32x2_t)(__p0 >= __p1);
   7023   return __ret;
   7024 }
   7025 #else
   7026 __ai __attribute__((target("neon"))) uint32x2_t vcge_s32(int32x2_t __p0, int32x2_t __p1) {
   7027   uint32x2_t __ret;
   7028   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7029   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7030   __ret = (uint32x2_t)(__rev0 >= __rev1);
   7031   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7032   return __ret;
   7033 }
   7034 #endif
   7035 
   7036 #ifdef __LITTLE_ENDIAN__
   7037 __ai __attribute__((target("neon"))) uint16x4_t vcge_s16(int16x4_t __p0, int16x4_t __p1) {
   7038   uint16x4_t __ret;
   7039   __ret = (uint16x4_t)(__p0 >= __p1);
   7040   return __ret;
   7041 }
   7042 #else
   7043 __ai __attribute__((target("neon"))) uint16x4_t vcge_s16(int16x4_t __p0, int16x4_t __p1) {
   7044   uint16x4_t __ret;
   7045   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7046   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7047   __ret = (uint16x4_t)(__rev0 >= __rev1);
   7048   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7049   return __ret;
   7050 }
   7051 #endif
   7052 
   7053 #ifdef __LITTLE_ENDIAN__
   7054 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7055   uint8x16_t __ret;
   7056   __ret = (uint8x16_t)(__p0 > __p1);
   7057   return __ret;
   7058 }
   7059 #else
   7060 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7061   uint8x16_t __ret;
   7062   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7063   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7064   __ret = (uint8x16_t)(__rev0 > __rev1);
   7065   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7066   return __ret;
   7067 }
   7068 #endif
   7069 
   7070 #ifdef __LITTLE_ENDIAN__
   7071 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7072   uint32x4_t __ret;
   7073   __ret = (uint32x4_t)(__p0 > __p1);
   7074   return __ret;
   7075 }
   7076 #else
   7077 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7078   uint32x4_t __ret;
   7079   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7080   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7081   __ret = (uint32x4_t)(__rev0 > __rev1);
   7082   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7083   return __ret;
   7084 }
   7085 #endif
   7086 
   7087 #ifdef __LITTLE_ENDIAN__
   7088 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7089   uint16x8_t __ret;
   7090   __ret = (uint16x8_t)(__p0 > __p1);
   7091   return __ret;
   7092 }
   7093 #else
   7094 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7095   uint16x8_t __ret;
   7096   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7097   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7098   __ret = (uint16x8_t)(__rev0 > __rev1);
   7099   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7100   return __ret;
   7101 }
   7102 #endif
   7103 
   7104 #ifdef __LITTLE_ENDIAN__
   7105 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_s8(int8x16_t __p0, int8x16_t __p1) {
   7106   uint8x16_t __ret;
   7107   __ret = (uint8x16_t)(__p0 > __p1);
   7108   return __ret;
   7109 }
   7110 #else
   7111 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_s8(int8x16_t __p0, int8x16_t __p1) {
   7112   uint8x16_t __ret;
   7113   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7114   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7115   __ret = (uint8x16_t)(__rev0 > __rev1);
   7116   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7117   return __ret;
   7118 }
   7119 #endif
   7120 
   7121 #ifdef __LITTLE_ENDIAN__
   7122 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_f32(float32x4_t __p0, float32x4_t __p1) {
   7123   uint32x4_t __ret;
   7124   __ret = (uint32x4_t)(__p0 > __p1);
   7125   return __ret;
   7126 }
   7127 #else
   7128 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_f32(float32x4_t __p0, float32x4_t __p1) {
   7129   uint32x4_t __ret;
   7130   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7131   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7132   __ret = (uint32x4_t)(__rev0 > __rev1);
   7133   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7134   return __ret;
   7135 }
   7136 #endif
   7137 
   7138 #ifdef __LITTLE_ENDIAN__
   7139 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_s32(int32x4_t __p0, int32x4_t __p1) {
   7140   uint32x4_t __ret;
   7141   __ret = (uint32x4_t)(__p0 > __p1);
   7142   return __ret;
   7143 }
   7144 #else
   7145 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_s32(int32x4_t __p0, int32x4_t __p1) {
   7146   uint32x4_t __ret;
   7147   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7148   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7149   __ret = (uint32x4_t)(__rev0 > __rev1);
   7150   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7151   return __ret;
   7152 }
   7153 #endif
   7154 
   7155 #ifdef __LITTLE_ENDIAN__
   7156 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_s16(int16x8_t __p0, int16x8_t __p1) {
   7157   uint16x8_t __ret;
   7158   __ret = (uint16x8_t)(__p0 > __p1);
   7159   return __ret;
   7160 }
   7161 #else
   7162 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_s16(int16x8_t __p0, int16x8_t __p1) {
   7163   uint16x8_t __ret;
   7164   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7165   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7166   __ret = (uint16x8_t)(__rev0 > __rev1);
   7167   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7168   return __ret;
   7169 }
   7170 #endif
   7171 
   7172 #ifdef __LITTLE_ENDIAN__
   7173 __ai __attribute__((target("neon"))) uint8x8_t vcgt_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7174   uint8x8_t __ret;
   7175   __ret = (uint8x8_t)(__p0 > __p1);
   7176   return __ret;
   7177 }
   7178 #else
   7179 __ai __attribute__((target("neon"))) uint8x8_t vcgt_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7180   uint8x8_t __ret;
   7181   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7182   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7183   __ret = (uint8x8_t)(__rev0 > __rev1);
   7184   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7185   return __ret;
   7186 }
   7187 #endif
   7188 
   7189 #ifdef __LITTLE_ENDIAN__
   7190 __ai __attribute__((target("neon"))) uint32x2_t vcgt_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7191   uint32x2_t __ret;
   7192   __ret = (uint32x2_t)(__p0 > __p1);
   7193   return __ret;
   7194 }
   7195 #else
   7196 __ai __attribute__((target("neon"))) uint32x2_t vcgt_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7197   uint32x2_t __ret;
   7198   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7199   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7200   __ret = (uint32x2_t)(__rev0 > __rev1);
   7201   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7202   return __ret;
   7203 }
   7204 #endif
   7205 
   7206 #ifdef __LITTLE_ENDIAN__
   7207 __ai __attribute__((target("neon"))) uint16x4_t vcgt_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7208   uint16x4_t __ret;
   7209   __ret = (uint16x4_t)(__p0 > __p1);
   7210   return __ret;
   7211 }
   7212 #else
   7213 __ai __attribute__((target("neon"))) uint16x4_t vcgt_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7214   uint16x4_t __ret;
   7215   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7216   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7217   __ret = (uint16x4_t)(__rev0 > __rev1);
   7218   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7219   return __ret;
   7220 }
   7221 #endif
   7222 
   7223 #ifdef __LITTLE_ENDIAN__
   7224 __ai __attribute__((target("neon"))) uint8x8_t vcgt_s8(int8x8_t __p0, int8x8_t __p1) {
   7225   uint8x8_t __ret;
   7226   __ret = (uint8x8_t)(__p0 > __p1);
   7227   return __ret;
   7228 }
   7229 #else
   7230 __ai __attribute__((target("neon"))) uint8x8_t vcgt_s8(int8x8_t __p0, int8x8_t __p1) {
   7231   uint8x8_t __ret;
   7232   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7233   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7234   __ret = (uint8x8_t)(__rev0 > __rev1);
   7235   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7236   return __ret;
   7237 }
   7238 #endif
   7239 
   7240 #ifdef __LITTLE_ENDIAN__
   7241 __ai __attribute__((target("neon"))) uint32x2_t vcgt_f32(float32x2_t __p0, float32x2_t __p1) {
   7242   uint32x2_t __ret;
   7243   __ret = (uint32x2_t)(__p0 > __p1);
   7244   return __ret;
   7245 }
   7246 #else
   7247 __ai __attribute__((target("neon"))) uint32x2_t vcgt_f32(float32x2_t __p0, float32x2_t __p1) {
   7248   uint32x2_t __ret;
   7249   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7250   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7251   __ret = (uint32x2_t)(__rev0 > __rev1);
   7252   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7253   return __ret;
   7254 }
   7255 #endif
   7256 
   7257 #ifdef __LITTLE_ENDIAN__
   7258 __ai __attribute__((target("neon"))) uint32x2_t vcgt_s32(int32x2_t __p0, int32x2_t __p1) {
   7259   uint32x2_t __ret;
   7260   __ret = (uint32x2_t)(__p0 > __p1);
   7261   return __ret;
   7262 }
   7263 #else
   7264 __ai __attribute__((target("neon"))) uint32x2_t vcgt_s32(int32x2_t __p0, int32x2_t __p1) {
   7265   uint32x2_t __ret;
   7266   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7267   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7268   __ret = (uint32x2_t)(__rev0 > __rev1);
   7269   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7270   return __ret;
   7271 }
   7272 #endif
   7273 
   7274 #ifdef __LITTLE_ENDIAN__
   7275 __ai __attribute__((target("neon"))) uint16x4_t vcgt_s16(int16x4_t __p0, int16x4_t __p1) {
   7276   uint16x4_t __ret;
   7277   __ret = (uint16x4_t)(__p0 > __p1);
   7278   return __ret;
   7279 }
   7280 #else
   7281 __ai __attribute__((target("neon"))) uint16x4_t vcgt_s16(int16x4_t __p0, int16x4_t __p1) {
   7282   uint16x4_t __ret;
   7283   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7284   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7285   __ret = (uint16x4_t)(__rev0 > __rev1);
   7286   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7287   return __ret;
   7288 }
   7289 #endif
   7290 
   7291 #ifdef __LITTLE_ENDIAN__
   7292 __ai __attribute__((target("neon"))) uint8x16_t vcleq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7293   uint8x16_t __ret;
   7294   __ret = (uint8x16_t)(__p0 <= __p1);
   7295   return __ret;
   7296 }
   7297 #else
   7298 __ai __attribute__((target("neon"))) uint8x16_t vcleq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7299   uint8x16_t __ret;
   7300   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7301   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7302   __ret = (uint8x16_t)(__rev0 <= __rev1);
   7303   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7304   return __ret;
   7305 }
   7306 #endif
   7307 
   7308 #ifdef __LITTLE_ENDIAN__
   7309 __ai __attribute__((target("neon"))) uint32x4_t vcleq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7310   uint32x4_t __ret;
   7311   __ret = (uint32x4_t)(__p0 <= __p1);
   7312   return __ret;
   7313 }
   7314 #else
   7315 __ai __attribute__((target("neon"))) uint32x4_t vcleq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7316   uint32x4_t __ret;
   7317   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7318   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7319   __ret = (uint32x4_t)(__rev0 <= __rev1);
   7320   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7321   return __ret;
   7322 }
   7323 #endif
   7324 
   7325 #ifdef __LITTLE_ENDIAN__
   7326 __ai __attribute__((target("neon"))) uint16x8_t vcleq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7327   uint16x8_t __ret;
   7328   __ret = (uint16x8_t)(__p0 <= __p1);
   7329   return __ret;
   7330 }
   7331 #else
   7332 __ai __attribute__((target("neon"))) uint16x8_t vcleq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7333   uint16x8_t __ret;
   7334   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7335   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7336   __ret = (uint16x8_t)(__rev0 <= __rev1);
   7337   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7338   return __ret;
   7339 }
   7340 #endif
   7341 
   7342 #ifdef __LITTLE_ENDIAN__
   7343 __ai __attribute__((target("neon"))) uint8x16_t vcleq_s8(int8x16_t __p0, int8x16_t __p1) {
   7344   uint8x16_t __ret;
   7345   __ret = (uint8x16_t)(__p0 <= __p1);
   7346   return __ret;
   7347 }
   7348 #else
   7349 __ai __attribute__((target("neon"))) uint8x16_t vcleq_s8(int8x16_t __p0, int8x16_t __p1) {
   7350   uint8x16_t __ret;
   7351   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7352   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7353   __ret = (uint8x16_t)(__rev0 <= __rev1);
   7354   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7355   return __ret;
   7356 }
   7357 #endif
   7358 
   7359 #ifdef __LITTLE_ENDIAN__
   7360 __ai __attribute__((target("neon"))) uint32x4_t vcleq_f32(float32x4_t __p0, float32x4_t __p1) {
   7361   uint32x4_t __ret;
   7362   __ret = (uint32x4_t)(__p0 <= __p1);
   7363   return __ret;
   7364 }
   7365 #else
   7366 __ai __attribute__((target("neon"))) uint32x4_t vcleq_f32(float32x4_t __p0, float32x4_t __p1) {
   7367   uint32x4_t __ret;
   7368   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7369   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7370   __ret = (uint32x4_t)(__rev0 <= __rev1);
   7371   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7372   return __ret;
   7373 }
   7374 #endif
   7375 
   7376 #ifdef __LITTLE_ENDIAN__
   7377 __ai __attribute__((target("neon"))) uint32x4_t vcleq_s32(int32x4_t __p0, int32x4_t __p1) {
   7378   uint32x4_t __ret;
   7379   __ret = (uint32x4_t)(__p0 <= __p1);
   7380   return __ret;
   7381 }
   7382 #else
   7383 __ai __attribute__((target("neon"))) uint32x4_t vcleq_s32(int32x4_t __p0, int32x4_t __p1) {
   7384   uint32x4_t __ret;
   7385   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7386   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7387   __ret = (uint32x4_t)(__rev0 <= __rev1);
   7388   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7389   return __ret;
   7390 }
   7391 #endif
   7392 
   7393 #ifdef __LITTLE_ENDIAN__
   7394 __ai __attribute__((target("neon"))) uint16x8_t vcleq_s16(int16x8_t __p0, int16x8_t __p1) {
   7395   uint16x8_t __ret;
   7396   __ret = (uint16x8_t)(__p0 <= __p1);
   7397   return __ret;
   7398 }
   7399 #else
   7400 __ai __attribute__((target("neon"))) uint16x8_t vcleq_s16(int16x8_t __p0, int16x8_t __p1) {
   7401   uint16x8_t __ret;
   7402   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7403   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7404   __ret = (uint16x8_t)(__rev0 <= __rev1);
   7405   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7406   return __ret;
   7407 }
   7408 #endif
   7409 
   7410 #ifdef __LITTLE_ENDIAN__
   7411 __ai __attribute__((target("neon"))) uint8x8_t vcle_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7412   uint8x8_t __ret;
   7413   __ret = (uint8x8_t)(__p0 <= __p1);
   7414   return __ret;
   7415 }
   7416 #else
   7417 __ai __attribute__((target("neon"))) uint8x8_t vcle_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7418   uint8x8_t __ret;
   7419   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7420   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7421   __ret = (uint8x8_t)(__rev0 <= __rev1);
   7422   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7423   return __ret;
   7424 }
   7425 #endif
   7426 
   7427 #ifdef __LITTLE_ENDIAN__
   7428 __ai __attribute__((target("neon"))) uint32x2_t vcle_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7429   uint32x2_t __ret;
   7430   __ret = (uint32x2_t)(__p0 <= __p1);
   7431   return __ret;
   7432 }
   7433 #else
   7434 __ai __attribute__((target("neon"))) uint32x2_t vcle_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7435   uint32x2_t __ret;
   7436   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7437   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7438   __ret = (uint32x2_t)(__rev0 <= __rev1);
   7439   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7440   return __ret;
   7441 }
   7442 #endif
   7443 
   7444 #ifdef __LITTLE_ENDIAN__
   7445 __ai __attribute__((target("neon"))) uint16x4_t vcle_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7446   uint16x4_t __ret;
   7447   __ret = (uint16x4_t)(__p0 <= __p1);
   7448   return __ret;
   7449 }
   7450 #else
   7451 __ai __attribute__((target("neon"))) uint16x4_t vcle_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7452   uint16x4_t __ret;
   7453   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7454   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7455   __ret = (uint16x4_t)(__rev0 <= __rev1);
   7456   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7457   return __ret;
   7458 }
   7459 #endif
   7460 
   7461 #ifdef __LITTLE_ENDIAN__
   7462 __ai __attribute__((target("neon"))) uint8x8_t vcle_s8(int8x8_t __p0, int8x8_t __p1) {
   7463   uint8x8_t __ret;
   7464   __ret = (uint8x8_t)(__p0 <= __p1);
   7465   return __ret;
   7466 }
   7467 #else
   7468 __ai __attribute__((target("neon"))) uint8x8_t vcle_s8(int8x8_t __p0, int8x8_t __p1) {
   7469   uint8x8_t __ret;
   7470   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7471   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7472   __ret = (uint8x8_t)(__rev0 <= __rev1);
   7473   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7474   return __ret;
   7475 }
   7476 #endif
   7477 
   7478 #ifdef __LITTLE_ENDIAN__
   7479 __ai __attribute__((target("neon"))) uint32x2_t vcle_f32(float32x2_t __p0, float32x2_t __p1) {
   7480   uint32x2_t __ret;
   7481   __ret = (uint32x2_t)(__p0 <= __p1);
   7482   return __ret;
   7483 }
   7484 #else
   7485 __ai __attribute__((target("neon"))) uint32x2_t vcle_f32(float32x2_t __p0, float32x2_t __p1) {
   7486   uint32x2_t __ret;
   7487   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7488   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7489   __ret = (uint32x2_t)(__rev0 <= __rev1);
   7490   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7491   return __ret;
   7492 }
   7493 #endif
   7494 
   7495 #ifdef __LITTLE_ENDIAN__
   7496 __ai __attribute__((target("neon"))) uint32x2_t vcle_s32(int32x2_t __p0, int32x2_t __p1) {
   7497   uint32x2_t __ret;
   7498   __ret = (uint32x2_t)(__p0 <= __p1);
   7499   return __ret;
   7500 }
   7501 #else
   7502 __ai __attribute__((target("neon"))) uint32x2_t vcle_s32(int32x2_t __p0, int32x2_t __p1) {
   7503   uint32x2_t __ret;
   7504   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7505   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7506   __ret = (uint32x2_t)(__rev0 <= __rev1);
   7507   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7508   return __ret;
   7509 }
   7510 #endif
   7511 
   7512 #ifdef __LITTLE_ENDIAN__
   7513 __ai __attribute__((target("neon"))) uint16x4_t vcle_s16(int16x4_t __p0, int16x4_t __p1) {
   7514   uint16x4_t __ret;
   7515   __ret = (uint16x4_t)(__p0 <= __p1);
   7516   return __ret;
   7517 }
   7518 #else
   7519 __ai __attribute__((target("neon"))) uint16x4_t vcle_s16(int16x4_t __p0, int16x4_t __p1) {
   7520   uint16x4_t __ret;
   7521   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7522   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7523   __ret = (uint16x4_t)(__rev0 <= __rev1);
   7524   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7525   return __ret;
   7526 }
   7527 #endif
   7528 
   7529 #ifdef __LITTLE_ENDIAN__
   7530 __ai __attribute__((target("neon"))) int8x16_t vclsq_u8(uint8x16_t __p0) {
   7531   int8x16_t __ret;
   7532   __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 32);
   7533   return __ret;
   7534 }
   7535 #else
   7536 __ai __attribute__((target("neon"))) int8x16_t vclsq_u8(uint8x16_t __p0) {
   7537   int8x16_t __ret;
   7538   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7539   __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 32);
   7540   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7541   return __ret;
   7542 }
   7543 #endif
   7544 
   7545 #ifdef __LITTLE_ENDIAN__
   7546 __ai __attribute__((target("neon"))) int32x4_t vclsq_u32(uint32x4_t __p0) {
   7547   int32x4_t __ret;
   7548   __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 34);
   7549   return __ret;
   7550 }
   7551 #else
   7552 __ai __attribute__((target("neon"))) int32x4_t vclsq_u32(uint32x4_t __p0) {
   7553   int32x4_t __ret;
   7554   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7555   __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 34);
   7556   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7557   return __ret;
   7558 }
   7559 #endif
   7560 
   7561 #ifdef __LITTLE_ENDIAN__
   7562 __ai __attribute__((target("neon"))) int16x8_t vclsq_u16(uint16x8_t __p0) {
   7563   int16x8_t __ret;
   7564   __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 33);
   7565   return __ret;
   7566 }
   7567 #else
   7568 __ai __attribute__((target("neon"))) int16x8_t vclsq_u16(uint16x8_t __p0) {
   7569   int16x8_t __ret;
   7570   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7571   __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 33);
   7572   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7573   return __ret;
   7574 }
   7575 #endif
   7576 
   7577 #ifdef __LITTLE_ENDIAN__
   7578 __ai __attribute__((target("neon"))) int8x16_t vclsq_s8(int8x16_t __p0) {
   7579   int8x16_t __ret;
   7580   __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 32);
   7581   return __ret;
   7582 }
   7583 #else
   7584 __ai __attribute__((target("neon"))) int8x16_t vclsq_s8(int8x16_t __p0) {
   7585   int8x16_t __ret;
   7586   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7587   __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 32);
   7588   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7589   return __ret;
   7590 }
   7591 #endif
   7592 
   7593 #ifdef __LITTLE_ENDIAN__
   7594 __ai __attribute__((target("neon"))) int32x4_t vclsq_s32(int32x4_t __p0) {
   7595   int32x4_t __ret;
   7596   __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 34);
   7597   return __ret;
   7598 }
   7599 #else
   7600 __ai __attribute__((target("neon"))) int32x4_t vclsq_s32(int32x4_t __p0) {
   7601   int32x4_t __ret;
   7602   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7603   __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 34);
   7604   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7605   return __ret;
   7606 }
   7607 #endif
   7608 
   7609 #ifdef __LITTLE_ENDIAN__
   7610 __ai __attribute__((target("neon"))) int16x8_t vclsq_s16(int16x8_t __p0) {
   7611   int16x8_t __ret;
   7612   __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 33);
   7613   return __ret;
   7614 }
   7615 #else
   7616 __ai __attribute__((target("neon"))) int16x8_t vclsq_s16(int16x8_t __p0) {
   7617   int16x8_t __ret;
   7618   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7619   __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 33);
   7620   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7621   return __ret;
   7622 }
   7623 #endif
   7624 
   7625 #ifdef __LITTLE_ENDIAN__
   7626 __ai __attribute__((target("neon"))) int8x8_t vcls_u8(uint8x8_t __p0) {
   7627   int8x8_t __ret;
   7628   __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__p0, 0);
   7629   return __ret;
   7630 }
   7631 #else
   7632 __ai __attribute__((target("neon"))) int8x8_t vcls_u8(uint8x8_t __p0) {
   7633   int8x8_t __ret;
   7634   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7635   __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 0);
   7636   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7637   return __ret;
   7638 }
   7639 #endif
   7640 
   7641 #ifdef __LITTLE_ENDIAN__
   7642 __ai __attribute__((target("neon"))) int32x2_t vcls_u32(uint32x2_t __p0) {
   7643   int32x2_t __ret;
   7644   __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__p0, 2);
   7645   return __ret;
   7646 }
   7647 #else
   7648 __ai __attribute__((target("neon"))) int32x2_t vcls_u32(uint32x2_t __p0) {
   7649   int32x2_t __ret;
   7650   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7651   __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 2);
   7652   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7653   return __ret;
   7654 }
   7655 #endif
   7656 
   7657 #ifdef __LITTLE_ENDIAN__
   7658 __ai __attribute__((target("neon"))) int16x4_t vcls_u16(uint16x4_t __p0) {
   7659   int16x4_t __ret;
   7660   __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__p0, 1);
   7661   return __ret;
   7662 }
   7663 #else
   7664 __ai __attribute__((target("neon"))) int16x4_t vcls_u16(uint16x4_t __p0) {
   7665   int16x4_t __ret;
   7666   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7667   __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 1);
   7668   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7669   return __ret;
   7670 }
   7671 #endif
   7672 
   7673 #ifdef __LITTLE_ENDIAN__
   7674 __ai __attribute__((target("neon"))) int8x8_t vcls_s8(int8x8_t __p0) {
   7675   int8x8_t __ret;
   7676   __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__p0, 0);
   7677   return __ret;
   7678 }
   7679 #else
   7680 __ai __attribute__((target("neon"))) int8x8_t vcls_s8(int8x8_t __p0) {
   7681   int8x8_t __ret;
   7682   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7683   __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 0);
   7684   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7685   return __ret;
   7686 }
   7687 #endif
   7688 
   7689 #ifdef __LITTLE_ENDIAN__
   7690 __ai __attribute__((target("neon"))) int32x2_t vcls_s32(int32x2_t __p0) {
   7691   int32x2_t __ret;
   7692   __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__p0, 2);
   7693   return __ret;
   7694 }
   7695 #else
   7696 __ai __attribute__((target("neon"))) int32x2_t vcls_s32(int32x2_t __p0) {
   7697   int32x2_t __ret;
   7698   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7699   __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 2);
   7700   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7701   return __ret;
   7702 }
   7703 #endif
   7704 
   7705 #ifdef __LITTLE_ENDIAN__
   7706 __ai __attribute__((target("neon"))) int16x4_t vcls_s16(int16x4_t __p0) {
   7707   int16x4_t __ret;
   7708   __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__p0, 1);
   7709   return __ret;
   7710 }
   7711 #else
   7712 __ai __attribute__((target("neon"))) int16x4_t vcls_s16(int16x4_t __p0) {
   7713   int16x4_t __ret;
   7714   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7715   __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 1);
   7716   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7717   return __ret;
   7718 }
   7719 #endif
   7720 
   7721 #ifdef __LITTLE_ENDIAN__
   7722 __ai __attribute__((target("neon"))) uint8x16_t vcltq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7723   uint8x16_t __ret;
   7724   __ret = (uint8x16_t)(__p0 < __p1);
   7725   return __ret;
   7726 }
   7727 #else
   7728 __ai __attribute__((target("neon"))) uint8x16_t vcltq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   7729   uint8x16_t __ret;
   7730   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7731   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7732   __ret = (uint8x16_t)(__rev0 < __rev1);
   7733   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7734   return __ret;
   7735 }
   7736 #endif
   7737 
   7738 #ifdef __LITTLE_ENDIAN__
   7739 __ai __attribute__((target("neon"))) uint32x4_t vcltq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7740   uint32x4_t __ret;
   7741   __ret = (uint32x4_t)(__p0 < __p1);
   7742   return __ret;
   7743 }
   7744 #else
   7745 __ai __attribute__((target("neon"))) uint32x4_t vcltq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   7746   uint32x4_t __ret;
   7747   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7748   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7749   __ret = (uint32x4_t)(__rev0 < __rev1);
   7750   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7751   return __ret;
   7752 }
   7753 #endif
   7754 
   7755 #ifdef __LITTLE_ENDIAN__
   7756 __ai __attribute__((target("neon"))) uint16x8_t vcltq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7757   uint16x8_t __ret;
   7758   __ret = (uint16x8_t)(__p0 < __p1);
   7759   return __ret;
   7760 }
   7761 #else
   7762 __ai __attribute__((target("neon"))) uint16x8_t vcltq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   7763   uint16x8_t __ret;
   7764   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7765   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7766   __ret = (uint16x8_t)(__rev0 < __rev1);
   7767   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7768   return __ret;
   7769 }
   7770 #endif
   7771 
   7772 #ifdef __LITTLE_ENDIAN__
   7773 __ai __attribute__((target("neon"))) uint8x16_t vcltq_s8(int8x16_t __p0, int8x16_t __p1) {
   7774   uint8x16_t __ret;
   7775   __ret = (uint8x16_t)(__p0 < __p1);
   7776   return __ret;
   7777 }
   7778 #else
   7779 __ai __attribute__((target("neon"))) uint8x16_t vcltq_s8(int8x16_t __p0, int8x16_t __p1) {
   7780   uint8x16_t __ret;
   7781   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7782   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7783   __ret = (uint8x16_t)(__rev0 < __rev1);
   7784   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7785   return __ret;
   7786 }
   7787 #endif
   7788 
   7789 #ifdef __LITTLE_ENDIAN__
   7790 __ai __attribute__((target("neon"))) uint32x4_t vcltq_f32(float32x4_t __p0, float32x4_t __p1) {
   7791   uint32x4_t __ret;
   7792   __ret = (uint32x4_t)(__p0 < __p1);
   7793   return __ret;
   7794 }
   7795 #else
   7796 __ai __attribute__((target("neon"))) uint32x4_t vcltq_f32(float32x4_t __p0, float32x4_t __p1) {
   7797   uint32x4_t __ret;
   7798   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7799   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7800   __ret = (uint32x4_t)(__rev0 < __rev1);
   7801   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7802   return __ret;
   7803 }
   7804 #endif
   7805 
   7806 #ifdef __LITTLE_ENDIAN__
   7807 __ai __attribute__((target("neon"))) uint32x4_t vcltq_s32(int32x4_t __p0, int32x4_t __p1) {
   7808   uint32x4_t __ret;
   7809   __ret = (uint32x4_t)(__p0 < __p1);
   7810   return __ret;
   7811 }
   7812 #else
   7813 __ai __attribute__((target("neon"))) uint32x4_t vcltq_s32(int32x4_t __p0, int32x4_t __p1) {
   7814   uint32x4_t __ret;
   7815   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7816   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7817   __ret = (uint32x4_t)(__rev0 < __rev1);
   7818   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7819   return __ret;
   7820 }
   7821 #endif
   7822 
   7823 #ifdef __LITTLE_ENDIAN__
   7824 __ai __attribute__((target("neon"))) uint16x8_t vcltq_s16(int16x8_t __p0, int16x8_t __p1) {
   7825   uint16x8_t __ret;
   7826   __ret = (uint16x8_t)(__p0 < __p1);
   7827   return __ret;
   7828 }
   7829 #else
   7830 __ai __attribute__((target("neon"))) uint16x8_t vcltq_s16(int16x8_t __p0, int16x8_t __p1) {
   7831   uint16x8_t __ret;
   7832   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7833   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7834   __ret = (uint16x8_t)(__rev0 < __rev1);
   7835   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7836   return __ret;
   7837 }
   7838 #endif
   7839 
   7840 #ifdef __LITTLE_ENDIAN__
   7841 __ai __attribute__((target("neon"))) uint8x8_t vclt_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7842   uint8x8_t __ret;
   7843   __ret = (uint8x8_t)(__p0 < __p1);
   7844   return __ret;
   7845 }
   7846 #else
   7847 __ai __attribute__((target("neon"))) uint8x8_t vclt_u8(uint8x8_t __p0, uint8x8_t __p1) {
   7848   uint8x8_t __ret;
   7849   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7850   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7851   __ret = (uint8x8_t)(__rev0 < __rev1);
   7852   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7853   return __ret;
   7854 }
   7855 #endif
   7856 
   7857 #ifdef __LITTLE_ENDIAN__
   7858 __ai __attribute__((target("neon"))) uint32x2_t vclt_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7859   uint32x2_t __ret;
   7860   __ret = (uint32x2_t)(__p0 < __p1);
   7861   return __ret;
   7862 }
   7863 #else
   7864 __ai __attribute__((target("neon"))) uint32x2_t vclt_u32(uint32x2_t __p0, uint32x2_t __p1) {
   7865   uint32x2_t __ret;
   7866   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7867   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7868   __ret = (uint32x2_t)(__rev0 < __rev1);
   7869   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7870   return __ret;
   7871 }
   7872 #endif
   7873 
   7874 #ifdef __LITTLE_ENDIAN__
   7875 __ai __attribute__((target("neon"))) uint16x4_t vclt_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7876   uint16x4_t __ret;
   7877   __ret = (uint16x4_t)(__p0 < __p1);
   7878   return __ret;
   7879 }
   7880 #else
   7881 __ai __attribute__((target("neon"))) uint16x4_t vclt_u16(uint16x4_t __p0, uint16x4_t __p1) {
   7882   uint16x4_t __ret;
   7883   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7884   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7885   __ret = (uint16x4_t)(__rev0 < __rev1);
   7886   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7887   return __ret;
   7888 }
   7889 #endif
   7890 
   7891 #ifdef __LITTLE_ENDIAN__
   7892 __ai __attribute__((target("neon"))) uint8x8_t vclt_s8(int8x8_t __p0, int8x8_t __p1) {
   7893   uint8x8_t __ret;
   7894   __ret = (uint8x8_t)(__p0 < __p1);
   7895   return __ret;
   7896 }
   7897 #else
   7898 __ai __attribute__((target("neon"))) uint8x8_t vclt_s8(int8x8_t __p0, int8x8_t __p1) {
   7899   uint8x8_t __ret;
   7900   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   7901   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   7902   __ret = (uint8x8_t)(__rev0 < __rev1);
   7903   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   7904   return __ret;
   7905 }
   7906 #endif
   7907 
   7908 #ifdef __LITTLE_ENDIAN__
   7909 __ai __attribute__((target("neon"))) uint32x2_t vclt_f32(float32x2_t __p0, float32x2_t __p1) {
   7910   uint32x2_t __ret;
   7911   __ret = (uint32x2_t)(__p0 < __p1);
   7912   return __ret;
   7913 }
   7914 #else
   7915 __ai __attribute__((target("neon"))) uint32x2_t vclt_f32(float32x2_t __p0, float32x2_t __p1) {
   7916   uint32x2_t __ret;
   7917   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7918   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7919   __ret = (uint32x2_t)(__rev0 < __rev1);
   7920   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7921   return __ret;
   7922 }
   7923 #endif
   7924 
   7925 #ifdef __LITTLE_ENDIAN__
   7926 __ai __attribute__((target("neon"))) uint32x2_t vclt_s32(int32x2_t __p0, int32x2_t __p1) {
   7927   uint32x2_t __ret;
   7928   __ret = (uint32x2_t)(__p0 < __p1);
   7929   return __ret;
   7930 }
   7931 #else
   7932 __ai __attribute__((target("neon"))) uint32x2_t vclt_s32(int32x2_t __p0, int32x2_t __p1) {
   7933   uint32x2_t __ret;
   7934   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   7935   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   7936   __ret = (uint32x2_t)(__rev0 < __rev1);
   7937   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   7938   return __ret;
   7939 }
   7940 #endif
   7941 
   7942 #ifdef __LITTLE_ENDIAN__
   7943 __ai __attribute__((target("neon"))) uint16x4_t vclt_s16(int16x4_t __p0, int16x4_t __p1) {
   7944   uint16x4_t __ret;
   7945   __ret = (uint16x4_t)(__p0 < __p1);
   7946   return __ret;
   7947 }
   7948 #else
   7949 __ai __attribute__((target("neon"))) uint16x4_t vclt_s16(int16x4_t __p0, int16x4_t __p1) {
   7950   uint16x4_t __ret;
   7951   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7952   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   7953   __ret = (uint16x4_t)(__rev0 < __rev1);
   7954   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7955   return __ret;
   7956 }
   7957 #endif
   7958 
   7959 #ifdef __LITTLE_ENDIAN__
   7960 __ai __attribute__((target("neon"))) uint8x16_t vclzq_u8(uint8x16_t __p0) {
   7961   uint8x16_t __ret;
   7962   __ret = (uint8x16_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 48);
   7963   return __ret;
   7964 }
   7965 #else
   7966 __ai __attribute__((target("neon"))) uint8x16_t vclzq_u8(uint8x16_t __p0) {
   7967   uint8x16_t __ret;
   7968   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7969   __ret = (uint8x16_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 48);
   7970   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   7971   return __ret;
   7972 }
   7973 #endif
   7974 
   7975 #ifdef __LITTLE_ENDIAN__
   7976 __ai __attribute__((target("neon"))) uint32x4_t vclzq_u32(uint32x4_t __p0) {
   7977   uint32x4_t __ret;
   7978   __ret = (uint32x4_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 50);
   7979   return __ret;
   7980 }
   7981 #else
   7982 __ai __attribute__((target("neon"))) uint32x4_t vclzq_u32(uint32x4_t __p0) {
   7983   uint32x4_t __ret;
   7984   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   7985   __ret = (uint32x4_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 50);
   7986   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   7987   return __ret;
   7988 }
   7989 #endif
   7990 
   7991 #ifdef __LITTLE_ENDIAN__
   7992 __ai __attribute__((target("neon"))) uint16x8_t vclzq_u16(uint16x8_t __p0) {
   7993   uint16x8_t __ret;
   7994   __ret = (uint16x8_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 49);
   7995   return __ret;
   7996 }
   7997 #else
   7998 __ai __attribute__((target("neon"))) uint16x8_t vclzq_u16(uint16x8_t __p0) {
   7999   uint16x8_t __ret;
   8000   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8001   __ret = (uint16x8_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 49);
   8002   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8003   return __ret;
   8004 }
   8005 #endif
   8006 
   8007 #ifdef __LITTLE_ENDIAN__
   8008 __ai __attribute__((target("neon"))) int8x16_t vclzq_s8(int8x16_t __p0) {
   8009   int8x16_t __ret;
   8010   __ret = (int8x16_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 32);
   8011   return __ret;
   8012 }
   8013 #else
   8014 __ai __attribute__((target("neon"))) int8x16_t vclzq_s8(int8x16_t __p0) {
   8015   int8x16_t __ret;
   8016   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8017   __ret = (int8x16_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 32);
   8018   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8019   return __ret;
   8020 }
   8021 #endif
   8022 
   8023 #ifdef __LITTLE_ENDIAN__
   8024 __ai __attribute__((target("neon"))) int32x4_t vclzq_s32(int32x4_t __p0) {
   8025   int32x4_t __ret;
   8026   __ret = (int32x4_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 34);
   8027   return __ret;
   8028 }
   8029 #else
   8030 __ai __attribute__((target("neon"))) int32x4_t vclzq_s32(int32x4_t __p0) {
   8031   int32x4_t __ret;
   8032   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8033   __ret = (int32x4_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 34);
   8034   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8035   return __ret;
   8036 }
   8037 #endif
   8038 
   8039 #ifdef __LITTLE_ENDIAN__
   8040 __ai __attribute__((target("neon"))) int16x8_t vclzq_s16(int16x8_t __p0) {
   8041   int16x8_t __ret;
   8042   __ret = (int16x8_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 33);
   8043   return __ret;
   8044 }
   8045 #else
   8046 __ai __attribute__((target("neon"))) int16x8_t vclzq_s16(int16x8_t __p0) {
   8047   int16x8_t __ret;
   8048   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8049   __ret = (int16x8_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 33);
   8050   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8051   return __ret;
   8052 }
   8053 #endif
   8054 
   8055 #ifdef __LITTLE_ENDIAN__
   8056 __ai __attribute__((target("neon"))) uint8x8_t vclz_u8(uint8x8_t __p0) {
   8057   uint8x8_t __ret;
   8058   __ret = (uint8x8_t) __builtin_neon_vclz_v((int8x8_t)__p0, 16);
   8059   return __ret;
   8060 }
   8061 #else
   8062 __ai __attribute__((target("neon"))) uint8x8_t vclz_u8(uint8x8_t __p0) {
   8063   uint8x8_t __ret;
   8064   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8065   __ret = (uint8x8_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 16);
   8066   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8067   return __ret;
   8068 }
   8069 #endif
   8070 
   8071 #ifdef __LITTLE_ENDIAN__
   8072 __ai __attribute__((target("neon"))) uint32x2_t vclz_u32(uint32x2_t __p0) {
   8073   uint32x2_t __ret;
   8074   __ret = (uint32x2_t) __builtin_neon_vclz_v((int8x8_t)__p0, 18);
   8075   return __ret;
   8076 }
   8077 #else
   8078 __ai __attribute__((target("neon"))) uint32x2_t vclz_u32(uint32x2_t __p0) {
   8079   uint32x2_t __ret;
   8080   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8081   __ret = (uint32x2_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 18);
   8082   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8083   return __ret;
   8084 }
   8085 #endif
   8086 
   8087 #ifdef __LITTLE_ENDIAN__
   8088 __ai __attribute__((target("neon"))) uint16x4_t vclz_u16(uint16x4_t __p0) {
   8089   uint16x4_t __ret;
   8090   __ret = (uint16x4_t) __builtin_neon_vclz_v((int8x8_t)__p0, 17);
   8091   return __ret;
   8092 }
   8093 #else
   8094 __ai __attribute__((target("neon"))) uint16x4_t vclz_u16(uint16x4_t __p0) {
   8095   uint16x4_t __ret;
   8096   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8097   __ret = (uint16x4_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 17);
   8098   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8099   return __ret;
   8100 }
   8101 #endif
   8102 
   8103 #ifdef __LITTLE_ENDIAN__
   8104 __ai __attribute__((target("neon"))) int8x8_t vclz_s8(int8x8_t __p0) {
   8105   int8x8_t __ret;
   8106   __ret = (int8x8_t) __builtin_neon_vclz_v((int8x8_t)__p0, 0);
   8107   return __ret;
   8108 }
   8109 #else
   8110 __ai __attribute__((target("neon"))) int8x8_t vclz_s8(int8x8_t __p0) {
   8111   int8x8_t __ret;
   8112   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8113   __ret = (int8x8_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 0);
   8114   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8115   return __ret;
   8116 }
   8117 #endif
   8118 
   8119 #ifdef __LITTLE_ENDIAN__
   8120 __ai __attribute__((target("neon"))) int32x2_t vclz_s32(int32x2_t __p0) {
   8121   int32x2_t __ret;
   8122   __ret = (int32x2_t) __builtin_neon_vclz_v((int8x8_t)__p0, 2);
   8123   return __ret;
   8124 }
   8125 #else
   8126 __ai __attribute__((target("neon"))) int32x2_t vclz_s32(int32x2_t __p0) {
   8127   int32x2_t __ret;
   8128   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8129   __ret = (int32x2_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 2);
   8130   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8131   return __ret;
   8132 }
   8133 #endif
   8134 
   8135 #ifdef __LITTLE_ENDIAN__
   8136 __ai __attribute__((target("neon"))) int16x4_t vclz_s16(int16x4_t __p0) {
   8137   int16x4_t __ret;
   8138   __ret = (int16x4_t) __builtin_neon_vclz_v((int8x8_t)__p0, 1);
   8139   return __ret;
   8140 }
   8141 #else
   8142 __ai __attribute__((target("neon"))) int16x4_t vclz_s16(int16x4_t __p0) {
   8143   int16x4_t __ret;
   8144   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8145   __ret = (int16x4_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 1);
   8146   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8147   return __ret;
   8148 }
   8149 #endif
   8150 
   8151 #ifdef __LITTLE_ENDIAN__
   8152 __ai __attribute__((target("neon"))) poly8x8_t vcnt_p8(poly8x8_t __p0) {
   8153   poly8x8_t __ret;
   8154   __ret = (poly8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 4);
   8155   return __ret;
   8156 }
   8157 #else
   8158 __ai __attribute__((target("neon"))) poly8x8_t vcnt_p8(poly8x8_t __p0) {
   8159   poly8x8_t __ret;
   8160   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8161   __ret = (poly8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 4);
   8162   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8163   return __ret;
   8164 }
   8165 #endif
   8166 
   8167 #ifdef __LITTLE_ENDIAN__
   8168 __ai __attribute__((target("neon"))) poly8x16_t vcntq_p8(poly8x16_t __p0) {
   8169   poly8x16_t __ret;
   8170   __ret = (poly8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 36);
   8171   return __ret;
   8172 }
   8173 #else
   8174 __ai __attribute__((target("neon"))) poly8x16_t vcntq_p8(poly8x16_t __p0) {
   8175   poly8x16_t __ret;
   8176   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8177   __ret = (poly8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 36);
   8178   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8179   return __ret;
   8180 }
   8181 #endif
   8182 
   8183 #ifdef __LITTLE_ENDIAN__
   8184 __ai __attribute__((target("neon"))) uint8x16_t vcntq_u8(uint8x16_t __p0) {
   8185   uint8x16_t __ret;
   8186   __ret = (uint8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 48);
   8187   return __ret;
   8188 }
   8189 #else
   8190 __ai __attribute__((target("neon"))) uint8x16_t vcntq_u8(uint8x16_t __p0) {
   8191   uint8x16_t __ret;
   8192   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8193   __ret = (uint8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 48);
   8194   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8195   return __ret;
   8196 }
   8197 #endif
   8198 
   8199 #ifdef __LITTLE_ENDIAN__
   8200 __ai __attribute__((target("neon"))) int8x16_t vcntq_s8(int8x16_t __p0) {
   8201   int8x16_t __ret;
   8202   __ret = (int8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 32);
   8203   return __ret;
   8204 }
   8205 #else
   8206 __ai __attribute__((target("neon"))) int8x16_t vcntq_s8(int8x16_t __p0) {
   8207   int8x16_t __ret;
   8208   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8209   __ret = (int8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 32);
   8210   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8211   return __ret;
   8212 }
   8213 #endif
   8214 
   8215 #ifdef __LITTLE_ENDIAN__
   8216 __ai __attribute__((target("neon"))) uint8x8_t vcnt_u8(uint8x8_t __p0) {
   8217   uint8x8_t __ret;
   8218   __ret = (uint8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 16);
   8219   return __ret;
   8220 }
   8221 #else
   8222 __ai __attribute__((target("neon"))) uint8x8_t vcnt_u8(uint8x8_t __p0) {
   8223   uint8x8_t __ret;
   8224   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8225   __ret = (uint8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 16);
   8226   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8227   return __ret;
   8228 }
   8229 #endif
   8230 
   8231 #ifdef __LITTLE_ENDIAN__
   8232 __ai __attribute__((target("neon"))) int8x8_t vcnt_s8(int8x8_t __p0) {
   8233   int8x8_t __ret;
   8234   __ret = (int8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 0);
   8235   return __ret;
   8236 }
   8237 #else
   8238 __ai __attribute__((target("neon"))) int8x8_t vcnt_s8(int8x8_t __p0) {
   8239   int8x8_t __ret;
   8240   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8241   __ret = (int8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 0);
   8242   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8243   return __ret;
   8244 }
   8245 #endif
   8246 
   8247 #ifdef __LITTLE_ENDIAN__
   8248 __ai __attribute__((target("neon"))) poly8x16_t vcombine_p8(poly8x8_t __p0, poly8x8_t __p1) {
   8249   poly8x16_t __ret;
   8250   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8251   return __ret;
   8252 }
   8253 #else
   8254 __ai __attribute__((target("neon"))) poly8x16_t vcombine_p8(poly8x8_t __p0, poly8x8_t __p1) {
   8255   poly8x16_t __ret;
   8256   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8257   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   8258   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8259   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8260   return __ret;
   8261 }
   8262 #endif
   8263 
   8264 #ifdef __LITTLE_ENDIAN__
   8265 __ai __attribute__((target("neon"))) poly16x8_t vcombine_p16(poly16x4_t __p0, poly16x4_t __p1) {
   8266   poly16x8_t __ret;
   8267   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8268   return __ret;
   8269 }
   8270 #else
   8271 __ai __attribute__((target("neon"))) poly16x8_t vcombine_p16(poly16x4_t __p0, poly16x4_t __p1) {
   8272   poly16x8_t __ret;
   8273   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8274   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   8275   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7);
   8276   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8277   return __ret;
   8278 }
   8279 #endif
   8280 
   8281 #ifdef __LITTLE_ENDIAN__
   8282 __ai __attribute__((target("neon"))) uint8x16_t vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) {
   8283   uint8x16_t __ret;
   8284   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8285   return __ret;
   8286 }
   8287 #else
   8288 __ai __attribute__((target("neon"))) uint8x16_t vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) {
   8289   uint8x16_t __ret;
   8290   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8291   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   8292   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8293   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8294   return __ret;
   8295 }
   8296 __ai __attribute__((target("neon"))) uint8x16_t __noswap_vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) {
   8297   uint8x16_t __ret;
   8298   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8299   return __ret;
   8300 }
   8301 #endif
   8302 
   8303 #ifdef __LITTLE_ENDIAN__
   8304 __ai __attribute__((target("neon"))) uint32x4_t vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) {
   8305   uint32x4_t __ret;
   8306   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8307   return __ret;
   8308 }
   8309 #else
   8310 __ai __attribute__((target("neon"))) uint32x4_t vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) {
   8311   uint32x4_t __ret;
   8312   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8313   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   8314   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3);
   8315   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8316   return __ret;
   8317 }
   8318 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) {
   8319   uint32x4_t __ret;
   8320   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8321   return __ret;
   8322 }
   8323 #endif
   8324 
   8325 #ifdef __LITTLE_ENDIAN__
   8326 __ai __attribute__((target("neon"))) uint64x2_t vcombine_u64(uint64x1_t __p0, uint64x1_t __p1) {
   8327   uint64x2_t __ret;
   8328   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
   8329   return __ret;
   8330 }
   8331 #else
   8332 __ai __attribute__((target("neon"))) uint64x2_t vcombine_u64(uint64x1_t __p0, uint64x1_t __p1) {
   8333   uint64x2_t __ret;
   8334   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
   8335   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8336   return __ret;
   8337 }
   8338 #endif
   8339 
   8340 #ifdef __LITTLE_ENDIAN__
   8341 __ai __attribute__((target("neon"))) uint16x8_t vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) {
   8342   uint16x8_t __ret;
   8343   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8344   return __ret;
   8345 }
   8346 #else
   8347 __ai __attribute__((target("neon"))) uint16x8_t vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) {
   8348   uint16x8_t __ret;
   8349   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8350   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   8351   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7);
   8352   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8353   return __ret;
   8354 }
   8355 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) {
   8356   uint16x8_t __ret;
   8357   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8358   return __ret;
   8359 }
   8360 #endif
   8361 
   8362 #ifdef __LITTLE_ENDIAN__
   8363 __ai __attribute__((target("neon"))) int8x16_t vcombine_s8(int8x8_t __p0, int8x8_t __p1) {
   8364   int8x16_t __ret;
   8365   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8366   return __ret;
   8367 }
   8368 #else
   8369 __ai __attribute__((target("neon"))) int8x16_t vcombine_s8(int8x8_t __p0, int8x8_t __p1) {
   8370   int8x16_t __ret;
   8371   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   8372   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   8373   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8374   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   8375   return __ret;
   8376 }
   8377 __ai __attribute__((target("neon"))) int8x16_t __noswap_vcombine_s8(int8x8_t __p0, int8x8_t __p1) {
   8378   int8x16_t __ret;
   8379   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15);
   8380   return __ret;
   8381 }
   8382 #endif
   8383 
   8384 #ifdef __LITTLE_ENDIAN__
        /* vcombine_f32: builds a float32x4_t from two float32x2_t values. With
         * __LITTLE_ENDIAN__ defined, a single shuffle takes __p0's lanes followed by
         * __p1's. */
   8385 __ai __attribute__((target("neon"))) float32x4_t vcombine_f32(float32x2_t __p0, float32x2_t __p1) {
   8386   float32x4_t __ret;
   8387   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8388   return __ret;
   8389 }
   8390 #else
        /* Without __LITTLE_ENDIAN__: each input is lane-reversed, the pair is
         * concatenated, and the result is lane-reversed again, so in shufflevector
         * index order __p1's lanes come before __p0's. */
   8391 __ai __attribute__((target("neon"))) float32x4_t vcombine_f32(float32x2_t __p0, float32x2_t __p1) {
   8392   float32x4_t __ret;
   8393   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8394   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   8395   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3);
   8396   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8397   return __ret;
   8398 }
        /* __noswap_vcombine_f32: the plain concatenation with no lane reversal.
         * NOTE(review): presumably for callers whose operands are already
         * lane-reversed; none is visible in this excerpt. */
   8399 __ai __attribute__((target("neon"))) float32x4_t __noswap_vcombine_f32(float32x2_t __p0, float32x2_t __p1) {
   8400   float32x4_t __ret;
   8401   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8402   return __ret;
   8403 }
   8404 #endif
   8405 
   8406 #ifdef __LITTLE_ENDIAN__
        /* vcombine_f16: builds a float16x8_t from two float16x4_t values. With
         * __LITTLE_ENDIAN__ defined, a single shuffle takes __p0's lanes followed by
         * __p1's. */
   8407 __ai __attribute__((target("neon"))) float16x8_t vcombine_f16(float16x4_t __p0, float16x4_t __p1) {
   8408   float16x8_t __ret;
   8409   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8410   return __ret;
   8411 }
   8412 #else
        /* Without __LITTLE_ENDIAN__: each input is lane-reversed, the pair is
         * concatenated, and the result is lane-reversed again, so in shufflevector
         * index order __p1's lanes come before __p0's. */
   8413 __ai __attribute__((target("neon"))) float16x8_t vcombine_f16(float16x4_t __p0, float16x4_t __p1) {
   8414   float16x8_t __ret;
   8415   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8416   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   8417   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7);
   8418   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8419   return __ret;
   8420 }
        /* __noswap_vcombine_f16: the plain concatenation with no lane reversal.
         * NOTE(review): presumably for callers whose operands are already
         * lane-reversed; none is visible in this excerpt. */
   8421 __ai __attribute__((target("neon"))) float16x8_t __noswap_vcombine_f16(float16x4_t __p0, float16x4_t __p1) {
   8422   float16x8_t __ret;
   8423   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8424   return __ret;
   8425 }
   8426 #endif
   8427 
   8428 #ifdef __LITTLE_ENDIAN__
        /* vcombine_s32: builds an int32x4_t from two int32x2_t values. With
         * __LITTLE_ENDIAN__ defined, a single shuffle takes __p0's lanes followed by
         * __p1's. */
   8429 __ai __attribute__((target("neon"))) int32x4_t vcombine_s32(int32x2_t __p0, int32x2_t __p1) {
   8430   int32x4_t __ret;
   8431   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8432   return __ret;
   8433 }
   8434 #else
        /* Without __LITTLE_ENDIAN__: each input is lane-reversed, the pair is
         * concatenated, and the result is lane-reversed again, so in shufflevector
         * index order __p1's lanes come before __p0's. */
   8435 __ai __attribute__((target("neon"))) int32x4_t vcombine_s32(int32x2_t __p0, int32x2_t __p1) {
   8436   int32x4_t __ret;
   8437   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8438   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   8439   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3);
   8440   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8441   return __ret;
   8442 }
        /* __noswap_vcombine_s32: the plain concatenation with no lane reversal.
         * NOTE(review): presumably for callers whose operands are already
         * lane-reversed; none is visible in this excerpt. */
   8443 __ai __attribute__((target("neon"))) int32x4_t __noswap_vcombine_s32(int32x2_t __p0, int32x2_t __p1) {
   8444   int32x4_t __ret;
   8445   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3);
   8446   return __ret;
   8447 }
   8448 #endif
   8449 
   8450 #ifdef __LITTLE_ENDIAN__
        /* vcombine_s64: builds an int64x2_t from two int64x1_t values. With
         * __LITTLE_ENDIAN__ defined, the result is the shuffle of indices 0 and 1
         * over the __p0,__p1 pair. */
   8451 __ai __attribute__((target("neon"))) int64x2_t vcombine_s64(int64x1_t __p0, int64x1_t __p1) {
   8452   int64x2_t __ret;
   8453   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
   8454   return __ret;
   8455 }
   8456 #else
        /* Without __LITTLE_ENDIAN__: the inputs are used as is (no per-input
         * reversal, unlike the wider-lane-count vcombine variants) and only the two
         * result lanes are swapped. No __noswap_ helper is defined in this group. */
   8457 __ai __attribute__((target("neon"))) int64x2_t vcombine_s64(int64x1_t __p0, int64x1_t __p1) {
   8458   int64x2_t __ret;
   8459   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
   8460   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8461   return __ret;
   8462 }
   8463 #endif
   8464 
   8465 #ifdef __LITTLE_ENDIAN__
        /* vcombine_s16: builds an int16x8_t from two int16x4_t values. With
         * __LITTLE_ENDIAN__ defined, a single shuffle takes __p0's lanes followed by
         * __p1's. */
   8466 __ai __attribute__((target("neon"))) int16x8_t vcombine_s16(int16x4_t __p0, int16x4_t __p1) {
   8467   int16x8_t __ret;
   8468   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8469   return __ret;
   8470 }
   8471 #else
        /* Without __LITTLE_ENDIAN__: each input is lane-reversed, the pair is
         * concatenated, and the result is lane-reversed again, so in shufflevector
         * index order __p1's lanes come before __p0's. */
   8472 __ai __attribute__((target("neon"))) int16x8_t vcombine_s16(int16x4_t __p0, int16x4_t __p1) {
   8473   int16x8_t __ret;
   8474   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8475   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   8476   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7);
   8477   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   8478   return __ret;
   8479 }
        /* __noswap_vcombine_s16: the plain concatenation with no lane reversal.
         * NOTE(review): presumably for callers whose operands are already
         * lane-reversed; none is visible in this excerpt. */
   8480 __ai __attribute__((target("neon"))) int16x8_t __noswap_vcombine_s16(int16x4_t __p0, int16x4_t __p1) {
   8481   int16x8_t __ret;
   8482   __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7);
   8483   return __ret;
   8484 }
   8485 #endif
   8486 
   8487 #define vcreate_p8(__p0) __extension__ ({ /* statement expression yielding a poly8x8_t made from __p0 */ \
   8488   poly8x8_t __ret; \
   8489   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8490   __ret = (poly8x8_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes poly8x8_t is 64 bits wide) - confirm */ \
   8491   __ret; /* value of the whole expression */ \
   8492 })
   8493 #define vcreate_p16(__p0) __extension__ ({ /* statement expression yielding a poly16x4_t made from __p0 */ \
   8494   poly16x4_t __ret; \
   8495   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8496   __ret = (poly16x4_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes poly16x4_t is 64 bits wide) - confirm */ \
   8497   __ret; /* value of the whole expression */ \
   8498 })
   8499 #define vcreate_u8(__p0) __extension__ ({ /* statement expression yielding a uint8x8_t made from __p0 */ \
   8500   uint8x8_t __ret; \
   8501   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8502   __ret = (uint8x8_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes uint8x8_t is 64 bits wide) - confirm */ \
   8503   __ret; /* value of the whole expression */ \
   8504 })
   8505 #define vcreate_u32(__p0) __extension__ ({ /* statement expression yielding a uint32x2_t made from __p0 */ \
   8506   uint32x2_t __ret; \
   8507   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8508   __ret = (uint32x2_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes uint32x2_t is 64 bits wide) - confirm */ \
   8509   __ret; /* value of the whole expression */ \
   8510 })
   8511 #define vcreate_u64(__p0) __extension__ ({ /* statement expression yielding a uint64x1_t made from __p0 */ \
   8512   uint64x1_t __ret; \
   8513   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8514   __ret = (uint64x1_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes uint64x1_t is 64 bits wide) - confirm */ \
   8515   __ret; /* value of the whole expression */ \
   8516 })
   8517 #define vcreate_u16(__p0) __extension__ ({ /* statement expression yielding a uint16x4_t made from __p0 */ \
   8518   uint16x4_t __ret; \
   8519   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8520   __ret = (uint16x4_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes uint16x4_t is 64 bits wide) - confirm */ \
   8521   __ret; /* value of the whole expression */ \
   8522 })
   8523 #define vcreate_s8(__p0) __extension__ ({ /* statement expression yielding an int8x8_t made from __p0 */ \
   8524   int8x8_t __ret; \
   8525   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8526   __ret = (int8x8_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes int8x8_t is 64 bits wide) - confirm */ \
   8527   __ret; /* value of the whole expression */ \
   8528 })
   8529 #define vcreate_f32(__p0) __extension__ ({ /* statement expression yielding a float32x2_t made from __p0 */ \
   8530   float32x2_t __ret; \
   8531   uint64_t __promote = __p0; /* the argument is first converted to uint64_t, i.e. treated as an integer */ \
   8532   __ret = (float32x2_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation, not a numeric int-to-float conversion (assumes float32x2_t is 64 bits wide) - confirm */ \
   8533   __ret; /* value of the whole expression */ \
   8534 })
   8535 #define vcreate_f16(__p0) __extension__ ({ /* statement expression yielding a float16x4_t made from __p0 */ \
   8536   float16x4_t __ret; \
   8537   uint64_t __promote = __p0; /* the argument is first converted to uint64_t, i.e. treated as an integer */ \
   8538   __ret = (float16x4_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation, not a numeric int-to-float conversion (assumes float16x4_t is 64 bits wide) - confirm */ \
   8539   __ret; /* value of the whole expression */ \
   8540 })
   8541 #define vcreate_s32(__p0) __extension__ ({ /* statement expression yielding an int32x2_t made from __p0 */ \
   8542   int32x2_t __ret; \
   8543   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8544   __ret = (int32x2_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes int32x2_t is 64 bits wide) - confirm */ \
   8545   __ret; /* value of the whole expression */ \
   8546 })
   8547 #define vcreate_s64(__p0) __extension__ ({ /* statement expression yielding an int64x1_t made from __p0 */ \
   8548   int64x1_t __ret; \
   8549   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8550   __ret = (int64x1_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes int64x1_t is 64 bits wide) - confirm */ \
   8551   __ret; /* value of the whole expression */ \
   8552 })
   8553 #define vcreate_s16(__p0) __extension__ ({ /* statement expression yielding an int16x4_t made from __p0 */ \
   8554   int16x4_t __ret; \
   8555   uint64_t __promote = __p0; /* the argument is first converted to uint64_t */ \
   8556   __ret = (int16x4_t)(__promote); /* NOTE(review): presumably a same-size bit reinterpretation (assumes int16x4_t is 64 bits wide) - confirm */ \
   8557   __ret; /* value of the whole expression */ \
   8558 })
   8559 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_f32_u32: returns, as float32x4_t, the result of
         * __builtin_neon_vcvtq_f32_v applied to the uint32x4_t __p0. The operand is
         * passed as int8x16_t together with the constant 50.
         * NOTE(review): 50 is presumably the builtin's code for the operand's real
         * vector type - confirm. */
   8560 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_u32(uint32x4_t __p0) {
   8561   float32x4_t __ret;
   8562   __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__p0, 50);
   8563   return __ret;
   8564 }
   8565 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8566 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_u32(uint32x4_t __p0) {
   8567   float32x4_t __ret;
   8568   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8569   __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__rev0, 50);
   8570   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8571   return __ret;
   8572 }
   8573 #endif
   8574 
   8575 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_f32_s32: returns, as float32x4_t, the result of
         * __builtin_neon_vcvtq_f32_v applied to the int32x4_t __p0. The operand is
         * passed as int8x16_t together with the constant 34.
         * NOTE(review): 34 is presumably the builtin's code for the operand's real
         * vector type - confirm. */
   8576 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_s32(int32x4_t __p0) {
   8577   float32x4_t __ret;
   8578   __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__p0, 34);
   8579   return __ret;
   8580 }
   8581 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8582 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_s32(int32x4_t __p0) {
   8583   float32x4_t __ret;
   8584   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8585   __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__rev0, 34);
   8586   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8587   return __ret;
   8588 }
   8589 #endif
   8590 
   8591 #ifdef __LITTLE_ENDIAN__
        /* vcvt_f32_u32: returns, as float32x2_t, the result of
         * __builtin_neon_vcvt_f32_v applied to the uint32x2_t __p0. The operand is
         * passed as int8x8_t together with the constant 18.
         * NOTE(review): 18 is presumably the builtin's code for the operand's real
         * vector type - confirm. */
   8592 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_u32(uint32x2_t __p0) {
   8593   float32x2_t __ret;
   8594   __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__p0, 18);
   8595   return __ret;
   8596 }
   8597 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8598 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_u32(uint32x2_t __p0) {
   8599   float32x2_t __ret;
   8600   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8601   __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__rev0, 18);
   8602   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8603   return __ret;
   8604 }
   8605 #endif
   8606 
   8607 #ifdef __LITTLE_ENDIAN__
        /* vcvt_f32_s32: returns, as float32x2_t, the result of
         * __builtin_neon_vcvt_f32_v applied to the int32x2_t __p0. The operand is
         * passed as int8x8_t together with the constant 2.
         * NOTE(review): 2 is presumably the builtin's code for the operand's real
         * vector type - confirm. */
   8608 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_s32(int32x2_t __p0) {
   8609   float32x2_t __ret;
   8610   __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__p0, 2);
   8611   return __ret;
   8612 }
   8613 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8614 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_s32(int32x2_t __p0) {
   8615   float32x2_t __ret;
   8616   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8617   __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__rev0, 2);
   8618   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8619   return __ret;
   8620 }
   8621 #endif
   8622 
   8623 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_n_f32_u32(__p0, __p1): yields, as float32x4_t, the result of
         * __builtin_neon_vcvtq_n_f32_v for the uint32x4_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 50 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 50 presumably encodes the operand's vector type - confirm both. */
   8624 #define vcvtq_n_f32_u32(__p0, __p1) __extension__ ({ \
   8625   float32x4_t __ret; \
   8626   uint32x4_t __s0 = __p0; \
   8627   __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__s0, __p1, 50); \
   8628   __ret; \
   8629 })
   8630 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8631 #define vcvtq_n_f32_u32(__p0, __p1) __extension__ ({ \
   8632   float32x4_t __ret; \
   8633   uint32x4_t __s0 = __p0; \
   8634   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   8635   __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__rev0, __p1, 50); \
   8636   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   8637   __ret; \
   8638 })
   8639 #endif
   8640 
   8641 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_n_f32_s32(__p0, __p1): yields, as float32x4_t, the result of
         * __builtin_neon_vcvtq_n_f32_v for the int32x4_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 34 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 34 presumably encodes the operand's vector type - confirm both. */
   8642 #define vcvtq_n_f32_s32(__p0, __p1) __extension__ ({ \
   8643   float32x4_t __ret; \
   8644   int32x4_t __s0 = __p0; \
   8645   __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__s0, __p1, 34); \
   8646   __ret; \
   8647 })
   8648 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8649 #define vcvtq_n_f32_s32(__p0, __p1) __extension__ ({ \
   8650   float32x4_t __ret; \
   8651   int32x4_t __s0 = __p0; \
   8652   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   8653   __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__rev0, __p1, 34); \
   8654   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   8655   __ret; \
   8656 })
   8657 #endif
   8658 
   8659 #ifdef __LITTLE_ENDIAN__
        /* vcvt_n_f32_u32(__p0, __p1): yields, as float32x2_t, the result of
         * __builtin_neon_vcvt_n_f32_v for the uint32x2_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 18 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 18 presumably encodes the operand's vector type - confirm both. */
   8660 #define vcvt_n_f32_u32(__p0, __p1) __extension__ ({ \
   8661   float32x2_t __ret; \
   8662   uint32x2_t __s0 = __p0; \
   8663   __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__s0, __p1, 18); \
   8664   __ret; \
   8665 })
   8666 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8667 #define vcvt_n_f32_u32(__p0, __p1) __extension__ ({ \
   8668   float32x2_t __ret; \
   8669   uint32x2_t __s0 = __p0; \
   8670   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   8671   __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__rev0, __p1, 18); \
   8672   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   8673   __ret; \
   8674 })
   8675 #endif
   8676 
   8677 #ifdef __LITTLE_ENDIAN__
        /* vcvt_n_f32_s32(__p0, __p1): yields, as float32x2_t, the result of
         * __builtin_neon_vcvt_n_f32_v for the int32x2_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 2 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 2 presumably encodes the operand's vector type - confirm both. */
   8678 #define vcvt_n_f32_s32(__p0, __p1) __extension__ ({ \
   8679   float32x2_t __ret; \
   8680   int32x2_t __s0 = __p0; \
   8681   __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__s0, __p1, 2); \
   8682   __ret; \
   8683 })
   8684 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8685 #define vcvt_n_f32_s32(__p0, __p1) __extension__ ({ \
   8686   float32x2_t __ret; \
   8687   int32x2_t __s0 = __p0; \
   8688   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   8689   __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__rev0, __p1, 2); \
   8690   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   8691   __ret; \
   8692 })
   8693 #endif
   8694 
   8695 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_n_s32_f32(__p0, __p1): yields, as int32x4_t, the result of
         * __builtin_neon_vcvtq_n_s32_v for the float32x4_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 34 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 34 presumably encodes a vector type for the builtin - confirm both. */
   8696 #define vcvtq_n_s32_f32(__p0, __p1) __extension__ ({ \
   8697   int32x4_t __ret; \
   8698   float32x4_t __s0 = __p0; \
   8699   __ret = (int32x4_t) __builtin_neon_vcvtq_n_s32_v((int8x16_t)__s0, __p1, 34); \
   8700   __ret; \
   8701 })
   8702 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8703 #define vcvtq_n_s32_f32(__p0, __p1) __extension__ ({ \
   8704   int32x4_t __ret; \
   8705   float32x4_t __s0 = __p0; \
   8706   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   8707   __ret = (int32x4_t) __builtin_neon_vcvtq_n_s32_v((int8x16_t)__rev0, __p1, 34); \
   8708   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   8709   __ret; \
   8710 })
   8711 #endif
   8712 
   8713 #ifdef __LITTLE_ENDIAN__
        /* vcvt_n_s32_f32(__p0, __p1): yields, as int32x2_t, the result of
         * __builtin_neon_vcvt_n_s32_v for the float32x2_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 2 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 2 presumably encodes a vector type for the builtin - confirm both. */
   8714 #define vcvt_n_s32_f32(__p0, __p1) __extension__ ({ \
   8715   int32x2_t __ret; \
   8716   float32x2_t __s0 = __p0; \
   8717   __ret = (int32x2_t) __builtin_neon_vcvt_n_s32_v((int8x8_t)__s0, __p1, 2); \
   8718   __ret; \
   8719 })
   8720 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8721 #define vcvt_n_s32_f32(__p0, __p1) __extension__ ({ \
   8722   int32x2_t __ret; \
   8723   float32x2_t __s0 = __p0; \
   8724   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   8725   __ret = (int32x2_t) __builtin_neon_vcvt_n_s32_v((int8x8_t)__rev0, __p1, 2); \
   8726   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   8727   __ret; \
   8728 })
   8729 #endif
   8730 
   8731 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_n_u32_f32(__p0, __p1): yields, as uint32x4_t, the result of
         * __builtin_neon_vcvtq_n_u32_v for the float32x4_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 50 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 50 presumably encodes a vector type for the builtin - confirm both. */
   8732 #define vcvtq_n_u32_f32(__p0, __p1) __extension__ ({ \
   8733   uint32x4_t __ret; \
   8734   float32x4_t __s0 = __p0; \
   8735   __ret = (uint32x4_t) __builtin_neon_vcvtq_n_u32_v((int8x16_t)__s0, __p1, 50); \
   8736   __ret; \
   8737 })
   8738 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8739 #define vcvtq_n_u32_f32(__p0, __p1) __extension__ ({ \
   8740   uint32x4_t __ret; \
   8741   float32x4_t __s0 = __p0; \
   8742   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   8743   __ret = (uint32x4_t) __builtin_neon_vcvtq_n_u32_v((int8x16_t)__rev0, __p1, 50); \
   8744   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   8745   __ret; \
   8746 })
   8747 #endif
   8748 
   8749 #ifdef __LITTLE_ENDIAN__
        /* vcvt_n_u32_f32(__p0, __p1): yields, as uint32x2_t, the result of
         * __builtin_neon_vcvt_n_u32_v for the float32x2_t __p0. __p1 is forwarded
         * unchanged as the builtin's second argument and 18 as its third.
         * NOTE(review): presumably a macro so that __p1 stays a constant expression,
         * and 18 presumably encodes a vector type for the builtin - confirm both. */
   8750 #define vcvt_n_u32_f32(__p0, __p1) __extension__ ({ \
   8751   uint32x2_t __ret; \
   8752   float32x2_t __s0 = __p0; \
   8753   __ret = (uint32x2_t) __builtin_neon_vcvt_n_u32_v((int8x8_t)__s0, __p1, 18); \
   8754   __ret; \
   8755 })
   8756 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but the operand's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8757 #define vcvt_n_u32_f32(__p0, __p1) __extension__ ({ \
   8758   uint32x2_t __ret; \
   8759   float32x2_t __s0 = __p0; \
   8760   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   8761   __ret = (uint32x2_t) __builtin_neon_vcvt_n_u32_v((int8x8_t)__rev0, __p1, 18); \
   8762   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   8763   __ret; \
   8764 })
   8765 #endif
   8766 
   8767 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_s32_f32: returns, as int32x4_t, the result of
         * __builtin_neon_vcvtq_s32_v applied to the float32x4_t __p0. The operand is
         * passed as int8x16_t together with the constant 34.
         * NOTE(review): 34 is presumably a vector type code understood by the
         * builtin - confirm. */
   8768 __ai __attribute__((target("neon"))) int32x4_t vcvtq_s32_f32(float32x4_t __p0) {
   8769   int32x4_t __ret;
   8770   __ret = (int32x4_t) __builtin_neon_vcvtq_s32_v((int8x16_t)__p0, 34);
   8771   return __ret;
   8772 }
   8773 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8774 __ai __attribute__((target("neon"))) int32x4_t vcvtq_s32_f32(float32x4_t __p0) {
   8775   int32x4_t __ret;
   8776   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8777   __ret = (int32x4_t) __builtin_neon_vcvtq_s32_v((int8x16_t)__rev0, 34);
   8778   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8779   return __ret;
   8780 }
   8781 #endif
   8782 
   8783 #ifdef __LITTLE_ENDIAN__
        /* vcvt_s32_f32: returns, as int32x2_t, the result of
         * __builtin_neon_vcvt_s32_v applied to the float32x2_t __p0. The operand is
         * passed as int8x8_t together with the constant 2.
         * NOTE(review): 2 is presumably a vector type code understood by the
         * builtin - confirm. */
   8784 __ai __attribute__((target("neon"))) int32x2_t vcvt_s32_f32(float32x2_t __p0) {
   8785   int32x2_t __ret;
   8786   __ret = (int32x2_t) __builtin_neon_vcvt_s32_v((int8x8_t)__p0, 2);
   8787   return __ret;
   8788 }
   8789 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8790 __ai __attribute__((target("neon"))) int32x2_t vcvt_s32_f32(float32x2_t __p0) {
   8791   int32x2_t __ret;
   8792   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8793   __ret = (int32x2_t) __builtin_neon_vcvt_s32_v((int8x8_t)__rev0, 2);
   8794   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8795   return __ret;
   8796 }
   8797 #endif
   8798 
   8799 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_u32_f32: returns, as uint32x4_t, the result of
         * __builtin_neon_vcvtq_u32_v applied to the float32x4_t __p0. The operand is
         * passed as int8x16_t together with the constant 50.
         * NOTE(review): 50 is presumably a vector type code understood by the
         * builtin - confirm. */
   8800 __ai __attribute__((target("neon"))) uint32x4_t vcvtq_u32_f32(float32x4_t __p0) {
   8801   uint32x4_t __ret;
   8802   __ret = (uint32x4_t) __builtin_neon_vcvtq_u32_v((int8x16_t)__p0, 50);
   8803   return __ret;
   8804 }
   8805 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8806 __ai __attribute__((target("neon"))) uint32x4_t vcvtq_u32_f32(float32x4_t __p0) {
   8807   uint32x4_t __ret;
   8808   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   8809   __ret = (uint32x4_t) __builtin_neon_vcvtq_u32_v((int8x16_t)__rev0, 50);
   8810   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   8811   return __ret;
   8812 }
   8813 #endif
   8814 
   8815 #ifdef __LITTLE_ENDIAN__
        /* vcvt_u32_f32: returns, as uint32x2_t, the result of
         * __builtin_neon_vcvt_u32_v applied to the float32x2_t __p0. The operand is
         * passed as int8x8_t together with the constant 18.
         * NOTE(review): 18 is presumably a vector type code understood by the
         * builtin - confirm. */
   8816 __ai __attribute__((target("neon"))) uint32x2_t vcvt_u32_f32(float32x2_t __p0) {
   8817   uint32x2_t __ret;
   8818   __ret = (uint32x2_t) __builtin_neon_vcvt_u32_v((int8x8_t)__p0, 18);
   8819   return __ret;
   8820 }
   8821 #else
        /* Without __LITTLE_ENDIAN__: same builtin call, but __p0's lanes are
         * reversed before it and the result's lanes are reversed after it. */
   8822 __ai __attribute__((target("neon"))) uint32x2_t vcvt_u32_f32(float32x2_t __p0) {
   8823   uint32x2_t __ret;
   8824   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   8825   __ret = (uint32x2_t) __builtin_neon_vcvt_u32_v((int8x8_t)__rev0, 18);
   8826   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   8827   return __ret;
   8828 }
   8829 #endif
   8830 
   8831 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_p8(vec, lane): copies the poly8x8_t operand into a local and
         * yields splat_lane_p8(local, lane) as a poly8x8_t. splat_lane_p8 is defined
         * outside this excerpt. NOTE(review): presumably it broadcasts the selected
         * lane to every result lane, and the _8 suffix on the locals presumably
         * avoids clashes with names inside that helper - confirm both. */
   8832 #define vdup_lane_p8(__p0_8, __p1_8) __extension__ ({ \
   8833   poly8x8_t __ret_8; \
   8834   poly8x8_t __s0_8 = __p0_8; \
   8835   __ret_8 = splat_lane_p8(__s0_8, __p1_8); \
   8836   __ret_8; \
   8837 })
   8838 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_p8 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   8839 #define vdup_lane_p8(__p0_9, __p1_9) __extension__ ({ \
   8840   poly8x8_t __ret_9; \
   8841   poly8x8_t __s0_9 = __p0_9; \
   8842   poly8x8_t __rev0_9;  __rev0_9 = __builtin_shufflevector(__s0_9, __s0_9, 7, 6, 5, 4, 3, 2, 1, 0); \
   8843   __ret_9 = __noswap_splat_lane_p8(__rev0_9, __p1_9); \
   8844   __ret_9 = __builtin_shufflevector(__ret_9, __ret_9, 7, 6, 5, 4, 3, 2, 1, 0); \
   8845   __ret_9; \
   8846 })
   8847 #endif
   8848 
   8849 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_p16(vec, lane): copies the poly16x4_t operand into a local and
         * yields splat_lane_p16(local, lane) as a poly16x4_t. splat_lane_p16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _10 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8850 #define vdup_lane_p16(__p0_10, __p1_10) __extension__ ({ \
   8851   poly16x4_t __ret_10; \
   8852   poly16x4_t __s0_10 = __p0_10; \
   8853   __ret_10 = splat_lane_p16(__s0_10, __p1_10); \
   8854   __ret_10; \
   8855 })
   8856 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_p16 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   8857 #define vdup_lane_p16(__p0_11, __p1_11) __extension__ ({ \
   8858   poly16x4_t __ret_11; \
   8859   poly16x4_t __s0_11 = __p0_11; \
   8860   poly16x4_t __rev0_11;  __rev0_11 = __builtin_shufflevector(__s0_11, __s0_11, 3, 2, 1, 0); \
   8861   __ret_11 = __noswap_splat_lane_p16(__rev0_11, __p1_11); \
   8862   __ret_11 = __builtin_shufflevector(__ret_11, __ret_11, 3, 2, 1, 0); \
   8863   __ret_11; \
   8864 })
   8865 #endif
   8866 
   8867 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_p8(vec, lane): copies the poly8x8_t operand into a local and
         * yields splatq_lane_p8(local, lane) as a poly8x16_t. splatq_lane_p8 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _12 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8868 #define vdupq_lane_p8(__p0_12, __p1_12) __extension__ ({ \
   8869   poly8x16_t __ret_12; \
   8870   poly8x8_t __s0_12 = __p0_12; \
   8871   __ret_12 = splatq_lane_p8(__s0_12, __p1_12); \
   8872   __ret_12; \
   8873 })
   8874 #else
        /* Without __LITTLE_ENDIAN__: the 8-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_p8 (defined elsewhere), and the 16-lane result is
         * lane-reversed before being yielded. */
   8875 #define vdupq_lane_p8(__p0_13, __p1_13) __extension__ ({ \
   8876   poly8x16_t __ret_13; \
   8877   poly8x8_t __s0_13 = __p0_13; \
   8878   poly8x8_t __rev0_13;  __rev0_13 = __builtin_shufflevector(__s0_13, __s0_13, 7, 6, 5, 4, 3, 2, 1, 0); \
   8879   __ret_13 = __noswap_splatq_lane_p8(__rev0_13, __p1_13); \
   8880   __ret_13 = __builtin_shufflevector(__ret_13, __ret_13, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   8881   __ret_13; \
   8882 })
   8883 #endif
   8884 
   8885 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_p16(vec, lane): copies the poly16x4_t operand into a local and
         * yields splatq_lane_p16(local, lane) as a poly16x8_t. splatq_lane_p16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _14 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8886 #define vdupq_lane_p16(__p0_14, __p1_14) __extension__ ({ \
   8887   poly16x8_t __ret_14; \
   8888   poly16x4_t __s0_14 = __p0_14; \
   8889   __ret_14 = splatq_lane_p16(__s0_14, __p1_14); \
   8890   __ret_14; \
   8891 })
   8892 #else
        /* Without __LITTLE_ENDIAN__: the 4-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_p16 (defined elsewhere), and the 8-lane result is
         * lane-reversed before being yielded. */
   8893 #define vdupq_lane_p16(__p0_15, __p1_15) __extension__ ({ \
   8894   poly16x8_t __ret_15; \
   8895   poly16x4_t __s0_15 = __p0_15; \
   8896   poly16x4_t __rev0_15;  __rev0_15 = __builtin_shufflevector(__s0_15, __s0_15, 3, 2, 1, 0); \
   8897   __ret_15 = __noswap_splatq_lane_p16(__rev0_15, __p1_15); \
   8898   __ret_15 = __builtin_shufflevector(__ret_15, __ret_15, 7, 6, 5, 4, 3, 2, 1, 0); \
   8899   __ret_15; \
   8900 })
   8901 #endif
   8902 
   8903 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_u8(vec, lane): copies the uint8x8_t operand into a local and
         * yields splatq_lane_u8(local, lane) as a uint8x16_t. splatq_lane_u8 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _16 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8904 #define vdupq_lane_u8(__p0_16, __p1_16) __extension__ ({ \
   8905   uint8x16_t __ret_16; \
   8906   uint8x8_t __s0_16 = __p0_16; \
   8907   __ret_16 = splatq_lane_u8(__s0_16, __p1_16); \
   8908   __ret_16; \
   8909 })
   8910 #else
        /* Without __LITTLE_ENDIAN__: the 8-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_u8 (defined elsewhere), and the 16-lane result is
         * lane-reversed before being yielded. */
   8911 #define vdupq_lane_u8(__p0_17, __p1_17) __extension__ ({ \
   8912   uint8x16_t __ret_17; \
   8913   uint8x8_t __s0_17 = __p0_17; \
   8914   uint8x8_t __rev0_17;  __rev0_17 = __builtin_shufflevector(__s0_17, __s0_17, 7, 6, 5, 4, 3, 2, 1, 0); \
   8915   __ret_17 = __noswap_splatq_lane_u8(__rev0_17, __p1_17); \
   8916   __ret_17 = __builtin_shufflevector(__ret_17, __ret_17, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   8917   __ret_17; \
   8918 })
   8919 #endif
   8920 
   8921 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_u32(vec, lane): copies the uint32x2_t operand into a local and
         * yields splatq_lane_u32(local, lane) as a uint32x4_t. splatq_lane_u32 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _18 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8922 #define vdupq_lane_u32(__p0_18, __p1_18) __extension__ ({ \
   8923   uint32x4_t __ret_18; \
   8924   uint32x2_t __s0_18 = __p0_18; \
   8925   __ret_18 = splatq_lane_u32(__s0_18, __p1_18); \
   8926   __ret_18; \
   8927 })
   8928 #else
        /* Without __LITTLE_ENDIAN__: the 2-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_u32 (defined elsewhere), and the 4-lane result is
         * lane-reversed before being yielded. */
   8929 #define vdupq_lane_u32(__p0_19, __p1_19) __extension__ ({ \
   8930   uint32x4_t __ret_19; \
   8931   uint32x2_t __s0_19 = __p0_19; \
   8932   uint32x2_t __rev0_19;  __rev0_19 = __builtin_shufflevector(__s0_19, __s0_19, 1, 0); \
   8933   __ret_19 = __noswap_splatq_lane_u32(__rev0_19, __p1_19); \
   8934   __ret_19 = __builtin_shufflevector(__ret_19, __ret_19, 3, 2, 1, 0); \
   8935   __ret_19; \
   8936 })
   8937 #endif
   8938 
   8939 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_u64(vec, lane): copies the uint64x1_t operand into a local and
         * yields splatq_lane_u64(local, lane) as a uint64x2_t. splatq_lane_u64 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _20 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8940 #define vdupq_lane_u64(__p0_20, __p1_20) __extension__ ({ \
   8941   uint64x2_t __ret_20; \
   8942   uint64x1_t __s0_20 = __p0_20; \
   8943   __ret_20 = splatq_lane_u64(__s0_20, __p1_20); \
   8944   __ret_20; \
   8945 })
   8946 #else
        /* Without __LITTLE_ENDIAN__: the operand goes to __noswap_splatq_lane_u64
         * (defined elsewhere) without any reversal (uint64x1_t presumably has a
         * single lane), and only the two result lanes are swapped. */
   8947 #define vdupq_lane_u64(__p0_21, __p1_21) __extension__ ({ \
   8948   uint64x2_t __ret_21; \
   8949   uint64x1_t __s0_21 = __p0_21; \
   8950   __ret_21 = __noswap_splatq_lane_u64(__s0_21, __p1_21); \
   8951   __ret_21 = __builtin_shufflevector(__ret_21, __ret_21, 1, 0); \
   8952   __ret_21; \
   8953 })
   8954 #endif
   8955 
   8956 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_u16(vec, lane): copies the uint16x4_t operand into a local and
         * yields splatq_lane_u16(local, lane) as a uint16x8_t. splatq_lane_u16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _22 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8957 #define vdupq_lane_u16(__p0_22, __p1_22) __extension__ ({ \
   8958   uint16x8_t __ret_22; \
   8959   uint16x4_t __s0_22 = __p0_22; \
   8960   __ret_22 = splatq_lane_u16(__s0_22, __p1_22); \
   8961   __ret_22; \
   8962 })
   8963 #else
        /* Without __LITTLE_ENDIAN__: the 4-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_u16 (defined elsewhere), and the 8-lane result is
         * lane-reversed before being yielded. */
   8964 #define vdupq_lane_u16(__p0_23, __p1_23) __extension__ ({ \
   8965   uint16x8_t __ret_23; \
   8966   uint16x4_t __s0_23 = __p0_23; \
   8967   uint16x4_t __rev0_23;  __rev0_23 = __builtin_shufflevector(__s0_23, __s0_23, 3, 2, 1, 0); \
   8968   __ret_23 = __noswap_splatq_lane_u16(__rev0_23, __p1_23); \
   8969   __ret_23 = __builtin_shufflevector(__ret_23, __ret_23, 7, 6, 5, 4, 3, 2, 1, 0); \
   8970   __ret_23; \
   8971 })
   8972 #endif
   8973 
   8974 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_s8(vec, lane): copies the int8x8_t operand into a local and
         * yields splatq_lane_s8(local, lane) as an int8x16_t. splatq_lane_s8 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _24 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8975 #define vdupq_lane_s8(__p0_24, __p1_24) __extension__ ({ \
   8976   int8x16_t __ret_24; \
   8977   int8x8_t __s0_24 = __p0_24; \
   8978   __ret_24 = splatq_lane_s8(__s0_24, __p1_24); \
   8979   __ret_24; \
   8980 })
   8981 #else
        /* Without __LITTLE_ENDIAN__: the 8-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_s8 (defined elsewhere), and the 16-lane result is
         * lane-reversed before being yielded. */
   8982 #define vdupq_lane_s8(__p0_25, __p1_25) __extension__ ({ \
   8983   int8x16_t __ret_25; \
   8984   int8x8_t __s0_25 = __p0_25; \
   8985   int8x8_t __rev0_25;  __rev0_25 = __builtin_shufflevector(__s0_25, __s0_25, 7, 6, 5, 4, 3, 2, 1, 0); \
   8986   __ret_25 = __noswap_splatq_lane_s8(__rev0_25, __p1_25); \
   8987   __ret_25 = __builtin_shufflevector(__ret_25, __ret_25, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   8988   __ret_25; \
   8989 })
   8990 #endif
   8991 
   8992 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_f32(vec, lane): copies the float32x2_t operand into a local and
         * yields splatq_lane_f32(local, lane) as a float32x4_t. splatq_lane_f32 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _26 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   8993 #define vdupq_lane_f32(__p0_26, __p1_26) __extension__ ({ \
   8994   float32x4_t __ret_26; \
   8995   float32x2_t __s0_26 = __p0_26; \
   8996   __ret_26 = splatq_lane_f32(__s0_26, __p1_26); \
   8997   __ret_26; \
   8998 })
   8999 #else
        /* Without __LITTLE_ENDIAN__: the 2-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_f32 (defined elsewhere), and the 4-lane result is
         * lane-reversed before being yielded. */
   9000 #define vdupq_lane_f32(__p0_27, __p1_27) __extension__ ({ \
   9001   float32x4_t __ret_27; \
   9002   float32x2_t __s0_27 = __p0_27; \
   9003   float32x2_t __rev0_27;  __rev0_27 = __builtin_shufflevector(__s0_27, __s0_27, 1, 0); \
   9004   __ret_27 = __noswap_splatq_lane_f32(__rev0_27, __p1_27); \
   9005   __ret_27 = __builtin_shufflevector(__ret_27, __ret_27, 3, 2, 1, 0); \
   9006   __ret_27; \
   9007 })
   9008 #endif
   9009 
   9010 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_f16(vec, lane): copies the float16x4_t operand into a local and
         * yields splatq_lane_f16(local, lane) as a float16x8_t. splatq_lane_f16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _28 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9011 #define vdupq_lane_f16(__p0_28, __p1_28) __extension__ ({ \
   9012   float16x8_t __ret_28; \
   9013   float16x4_t __s0_28 = __p0_28; \
   9014   __ret_28 = splatq_lane_f16(__s0_28, __p1_28); \
   9015   __ret_28; \
   9016 })
   9017 #else
        /* Without __LITTLE_ENDIAN__: the 4-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_f16 (defined elsewhere), and the 8-lane result is
         * lane-reversed before being yielded. */
   9018 #define vdupq_lane_f16(__p0_29, __p1_29) __extension__ ({ \
   9019   float16x8_t __ret_29; \
   9020   float16x4_t __s0_29 = __p0_29; \
   9021   float16x4_t __rev0_29;  __rev0_29 = __builtin_shufflevector(__s0_29, __s0_29, 3, 2, 1, 0); \
   9022   __ret_29 = __noswap_splatq_lane_f16(__rev0_29, __p1_29); \
   9023   __ret_29 = __builtin_shufflevector(__ret_29, __ret_29, 7, 6, 5, 4, 3, 2, 1, 0); \
   9024   __ret_29; \
   9025 })
   9026 #endif
   9027 
   9028 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_s32(vec, lane): copies the int32x2_t operand into a local and
         * yields splatq_lane_s32(local, lane) as an int32x4_t. splatq_lane_s32 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _30 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9029 #define vdupq_lane_s32(__p0_30, __p1_30) __extension__ ({ \
   9030   int32x4_t __ret_30; \
   9031   int32x2_t __s0_30 = __p0_30; \
   9032   __ret_30 = splatq_lane_s32(__s0_30, __p1_30); \
   9033   __ret_30; \
   9034 })
   9035 #else
        /* Without __LITTLE_ENDIAN__: the 2-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_s32 (defined elsewhere), and the 4-lane result is
         * lane-reversed before being yielded. */
   9036 #define vdupq_lane_s32(__p0_31, __p1_31) __extension__ ({ \
   9037   int32x4_t __ret_31; \
   9038   int32x2_t __s0_31 = __p0_31; \
   9039   int32x2_t __rev0_31;  __rev0_31 = __builtin_shufflevector(__s0_31, __s0_31, 1, 0); \
   9040   __ret_31 = __noswap_splatq_lane_s32(__rev0_31, __p1_31); \
   9041   __ret_31 = __builtin_shufflevector(__ret_31, __ret_31, 3, 2, 1, 0); \
   9042   __ret_31; \
   9043 })
   9044 #endif
   9045 
   9046 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_s64(vec, lane): copies the int64x1_t operand into a local and
         * yields splatq_lane_s64(local, lane) as an int64x2_t. splatq_lane_s64 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _32 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9047 #define vdupq_lane_s64(__p0_32, __p1_32) __extension__ ({ \
   9048   int64x2_t __ret_32; \
   9049   int64x1_t __s0_32 = __p0_32; \
   9050   __ret_32 = splatq_lane_s64(__s0_32, __p1_32); \
   9051   __ret_32; \
   9052 })
   9053 #else
        /* Without __LITTLE_ENDIAN__: the operand goes to __noswap_splatq_lane_s64
         * (defined elsewhere) without any reversal (int64x1_t presumably has a
         * single lane), and only the two result lanes are swapped. */
   9054 #define vdupq_lane_s64(__p0_33, __p1_33) __extension__ ({ \
   9055   int64x2_t __ret_33; \
   9056   int64x1_t __s0_33 = __p0_33; \
   9057   __ret_33 = __noswap_splatq_lane_s64(__s0_33, __p1_33); \
   9058   __ret_33 = __builtin_shufflevector(__ret_33, __ret_33, 1, 0); \
   9059   __ret_33; \
   9060 })
   9061 #endif
   9062 
   9063 #ifdef __LITTLE_ENDIAN__
        /* vdupq_lane_s16(vec, lane): copies the int16x4_t operand into a local and
         * yields splatq_lane_s16(local, lane) as an int16x8_t. splatq_lane_s16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _34 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9064 #define vdupq_lane_s16(__p0_34, __p1_34) __extension__ ({ \
   9065   int16x8_t __ret_34; \
   9066   int16x4_t __s0_34 = __p0_34; \
   9067   __ret_34 = splatq_lane_s16(__s0_34, __p1_34); \
   9068   __ret_34; \
   9069 })
   9070 #else
        /* Without __LITTLE_ENDIAN__: the 4-lane operand is lane-reversed, handed to
         * __noswap_splatq_lane_s16 (defined elsewhere), and the 8-lane result is
         * lane-reversed before being yielded. */
   9071 #define vdupq_lane_s16(__p0_35, __p1_35) __extension__ ({ \
   9072   int16x8_t __ret_35; \
   9073   int16x4_t __s0_35 = __p0_35; \
   9074   int16x4_t __rev0_35;  __rev0_35 = __builtin_shufflevector(__s0_35, __s0_35, 3, 2, 1, 0); \
   9075   __ret_35 = __noswap_splatq_lane_s16(__rev0_35, __p1_35); \
   9076   __ret_35 = __builtin_shufflevector(__ret_35, __ret_35, 7, 6, 5, 4, 3, 2, 1, 0); \
   9077   __ret_35; \
   9078 })
   9079 #endif
   9080 
   9081 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_u8(vec, lane): copies the uint8x8_t operand into a local and
         * yields splat_lane_u8(local, lane) as a uint8x8_t. splat_lane_u8 is defined
         * outside this excerpt. NOTE(review): presumably it broadcasts the selected
         * lane to every result lane, and the _36 suffix on the locals presumably
         * avoids clashes with names inside that helper - confirm both. */
   9082 #define vdup_lane_u8(__p0_36, __p1_36) __extension__ ({ \
   9083   uint8x8_t __ret_36; \
   9084   uint8x8_t __s0_36 = __p0_36; \
   9085   __ret_36 = splat_lane_u8(__s0_36, __p1_36); \
   9086   __ret_36; \
   9087 })
   9088 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_u8 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   9089 #define vdup_lane_u8(__p0_37, __p1_37) __extension__ ({ \
   9090   uint8x8_t __ret_37; \
   9091   uint8x8_t __s0_37 = __p0_37; \
   9092   uint8x8_t __rev0_37;  __rev0_37 = __builtin_shufflevector(__s0_37, __s0_37, 7, 6, 5, 4, 3, 2, 1, 0); \
   9093   __ret_37 = __noswap_splat_lane_u8(__rev0_37, __p1_37); \
   9094   __ret_37 = __builtin_shufflevector(__ret_37, __ret_37, 7, 6, 5, 4, 3, 2, 1, 0); \
   9095   __ret_37; \
   9096 })
   9097 #endif
   9098 
   9099 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_u32(vec, lane): copies the uint32x2_t operand into a local and
         * yields splat_lane_u32(local, lane) as a uint32x2_t. splat_lane_u32 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _38 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9100 #define vdup_lane_u32(__p0_38, __p1_38) __extension__ ({ \
   9101   uint32x2_t __ret_38; \
   9102   uint32x2_t __s0_38 = __p0_38; \
   9103   __ret_38 = splat_lane_u32(__s0_38, __p1_38); \
   9104   __ret_38; \
   9105 })
   9106 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_u32 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   9107 #define vdup_lane_u32(__p0_39, __p1_39) __extension__ ({ \
   9108   uint32x2_t __ret_39; \
   9109   uint32x2_t __s0_39 = __p0_39; \
   9110   uint32x2_t __rev0_39;  __rev0_39 = __builtin_shufflevector(__s0_39, __s0_39, 1, 0); \
   9111   __ret_39 = __noswap_splat_lane_u32(__rev0_39, __p1_39); \
   9112   __ret_39 = __builtin_shufflevector(__ret_39, __ret_39, 1, 0); \
   9113   __ret_39; \
   9114 })
   9115 #endif
   9116 
   9117 #define vdup_lane_u64(__p0_40, __p1_40) __extension__ ({ /* yields splat_lane_u64(vec, lane) as a uint64x1_t; single definition, not conditional on __LITTLE_ENDIAN__ */ \
   9118   uint64x1_t __ret_40; \
   9119   uint64x1_t __s0_40 = __p0_40; /* the operand is copied into a typed local before use */ \
   9120   __ret_40 = splat_lane_u64(__s0_40, __p1_40); /* helper defined outside this excerpt; NOTE(review): presumably broadcasts the selected lane - confirm */ \
   9121   __ret_40; /* value of the whole expression */ \
   9122 })
   9123 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_u16(vec, lane): copies the uint16x4_t operand into a local and
         * yields splat_lane_u16(local, lane) as a uint16x4_t. splat_lane_u16 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _41 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9124 #define vdup_lane_u16(__p0_41, __p1_41) __extension__ ({ \
   9125   uint16x4_t __ret_41; \
   9126   uint16x4_t __s0_41 = __p0_41; \
   9127   __ret_41 = splat_lane_u16(__s0_41, __p1_41); \
   9128   __ret_41; \
   9129 })
   9130 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_u16 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   9131 #define vdup_lane_u16(__p0_42, __p1_42) __extension__ ({ \
   9132   uint16x4_t __ret_42; \
   9133   uint16x4_t __s0_42 = __p0_42; \
   9134   uint16x4_t __rev0_42;  __rev0_42 = __builtin_shufflevector(__s0_42, __s0_42, 3, 2, 1, 0); \
   9135   __ret_42 = __noswap_splat_lane_u16(__rev0_42, __p1_42); \
   9136   __ret_42 = __builtin_shufflevector(__ret_42, __ret_42, 3, 2, 1, 0); \
   9137   __ret_42; \
   9138 })
   9139 #endif
   9140 
   9141 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_s8(vec, lane): copies the int8x8_t operand into a local and
         * yields splat_lane_s8(local, lane) as an int8x8_t. splat_lane_s8 is defined
         * outside this excerpt. NOTE(review): presumably it broadcasts the selected
         * lane to every result lane, and the _43 suffix on the locals presumably
         * avoids clashes with names inside that helper - confirm both. */
   9142 #define vdup_lane_s8(__p0_43, __p1_43) __extension__ ({ \
   9143   int8x8_t __ret_43; \
   9144   int8x8_t __s0_43 = __p0_43; \
   9145   __ret_43 = splat_lane_s8(__s0_43, __p1_43); \
   9146   __ret_43; \
   9147 })
   9148 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_s8 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   9149 #define vdup_lane_s8(__p0_44, __p1_44) __extension__ ({ \
   9150   int8x8_t __ret_44; \
   9151   int8x8_t __s0_44 = __p0_44; \
   9152   int8x8_t __rev0_44;  __rev0_44 = __builtin_shufflevector(__s0_44, __s0_44, 7, 6, 5, 4, 3, 2, 1, 0); \
   9153   __ret_44 = __noswap_splat_lane_s8(__rev0_44, __p1_44); \
   9154   __ret_44 = __builtin_shufflevector(__ret_44, __ret_44, 7, 6, 5, 4, 3, 2, 1, 0); \
   9155   __ret_44; \
   9156 })
   9157 #endif
   9158 
   9159 #ifdef __LITTLE_ENDIAN__
        /* vdup_lane_f32(vec, lane): copies the float32x2_t operand into a local and
         * yields splat_lane_f32(local, lane) as a float32x2_t. splat_lane_f32 is
         * defined outside this excerpt. NOTE(review): presumably it broadcasts the
         * selected lane to every result lane, and the _45 suffix on the locals
         * presumably avoids clashes with names inside that helper - confirm both. */
   9160 #define vdup_lane_f32(__p0_45, __p1_45) __extension__ ({ \
   9161   float32x2_t __ret_45; \
   9162   float32x2_t __s0_45 = __p0_45; \
   9163   __ret_45 = splat_lane_f32(__s0_45, __p1_45); \
   9164   __ret_45; \
   9165 })
   9166 #else
        /* Without __LITTLE_ENDIAN__: the operand is lane-reversed, handed to
         * __noswap_splat_lane_f32 (defined elsewhere), and the result is
         * lane-reversed before being yielded. */
   9167 #define vdup_lane_f32(__p0_46, __p1_46) __extension__ ({ \
   9168   float32x2_t __ret_46; \
   9169   float32x2_t __s0_46 = __p0_46; \
   9170   float32x2_t __rev0_46;  __rev0_46 = __builtin_shufflevector(__s0_46, __s0_46, 1, 0); \
   9171   __ret_46 = __noswap_splat_lane_f32(__rev0_46, __p1_46); \
   9172   __ret_46 = __builtin_shufflevector(__ret_46, __ret_46, 1, 0); \
   9173   __ret_46; \
   9174 })
   9175 #endif
   9176 
   9177 #ifdef __LITTLE_ENDIAN__
   9178 #define vdup_lane_f16(__p0_47, __p1_47) __extension__ ({ \
   9179   float16x4_t __ret_47; \
   9180   float16x4_t __s0_47 = __p0_47; \
   9181   __ret_47 = splat_lane_f16(__s0_47, __p1_47); \
   9182   __ret_47; \
   9183 })
   9184 #else
   9185 #define vdup_lane_f16(__p0_48, __p1_48) __extension__ ({ \
   9186   float16x4_t __ret_48; \
   9187   float16x4_t __s0_48 = __p0_48; \
   9188   float16x4_t __rev0_48;  __rev0_48 = __builtin_shufflevector(__s0_48, __s0_48, 3, 2, 1, 0); \
   9189   __ret_48 = __noswap_splat_lane_f16(__rev0_48, __p1_48); \
   9190   __ret_48 = __builtin_shufflevector(__ret_48, __ret_48, 3, 2, 1, 0); \
   9191   __ret_48; \
   9192 })
   9193 #endif
   9194 
   9195 #ifdef __LITTLE_ENDIAN__
   9196 #define vdup_lane_s32(__p0_49, __p1_49) __extension__ ({ \
   9197   int32x2_t __ret_49; \
   9198   int32x2_t __s0_49 = __p0_49; \
   9199   __ret_49 = splat_lane_s32(__s0_49, __p1_49); \
   9200   __ret_49; \
   9201 })
   9202 #else
   9203 #define vdup_lane_s32(__p0_50, __p1_50) __extension__ ({ \
   9204   int32x2_t __ret_50; \
   9205   int32x2_t __s0_50 = __p0_50; \
   9206   int32x2_t __rev0_50;  __rev0_50 = __builtin_shufflevector(__s0_50, __s0_50, 1, 0); \
   9207   __ret_50 = __noswap_splat_lane_s32(__rev0_50, __p1_50); \
   9208   __ret_50 = __builtin_shufflevector(__ret_50, __ret_50, 1, 0); \
   9209   __ret_50; \
   9210 })
   9211 #endif
   9212 
   9213 #define vdup_lane_s64(__p0_51, __p1_51) __extension__ ({ \
   9214   int64x1_t __ret_51; \
   9215   int64x1_t __s0_51 = __p0_51; \
   9216   __ret_51 = splat_lane_s64(__s0_51, __p1_51); \
   9217   __ret_51; \
   9218 })
   9219 #ifdef __LITTLE_ENDIAN__
   9220 #define vdup_lane_s16(__p0_52, __p1_52) __extension__ ({ \
   9221   int16x4_t __ret_52; \
   9222   int16x4_t __s0_52 = __p0_52; \
   9223   __ret_52 = splat_lane_s16(__s0_52, __p1_52); \
   9224   __ret_52; \
   9225 })
   9226 #else
   9227 #define vdup_lane_s16(__p0_53, __p1_53) __extension__ ({ \
   9228   int16x4_t __ret_53; \
   9229   int16x4_t __s0_53 = __p0_53; \
   9230   int16x4_t __rev0_53;  __rev0_53 = __builtin_shufflevector(__s0_53, __s0_53, 3, 2, 1, 0); \
   9231   __ret_53 = __noswap_splat_lane_s16(__rev0_53, __p1_53); \
   9232   __ret_53 = __builtin_shufflevector(__ret_53, __ret_53, 3, 2, 1, 0); \
   9233   __ret_53; \
   9234 })
   9235 #endif
   9236 
   9237 #ifdef __LITTLE_ENDIAN__
   9238 __ai __attribute__((target("neon"))) poly8x8_t vdup_n_p8(poly8_t __p0) {
   9239   poly8x8_t __ret;
   9240   __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9241   return __ret;
   9242 }
   9243 #else
   9244 __ai __attribute__((target("neon"))) poly8x8_t vdup_n_p8(poly8_t __p0) {
   9245   poly8x8_t __ret;
   9246   __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9247   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9248   return __ret;
   9249 }
   9250 #endif
   9251 
   9252 #ifdef __LITTLE_ENDIAN__
   9253 __ai __attribute__((target("neon"))) poly16x4_t vdup_n_p16(poly16_t __p0) {
   9254   poly16x4_t __ret;
   9255   __ret = (poly16x4_t) {__p0, __p0, __p0, __p0};
   9256   return __ret;
   9257 }
   9258 #else
   9259 __ai __attribute__((target("neon"))) poly16x4_t vdup_n_p16(poly16_t __p0) {
   9260   poly16x4_t __ret;
   9261   __ret = (poly16x4_t) {__p0, __p0, __p0, __p0};
   9262   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9263   return __ret;
   9264 }
   9265 #endif
   9266 
   9267 #ifdef __LITTLE_ENDIAN__
   9268 __ai __attribute__((target("neon"))) poly8x16_t vdupq_n_p8(poly8_t __p0) {
   9269   poly8x16_t __ret;
   9270   __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9271   return __ret;
   9272 }
   9273 #else
   9274 __ai __attribute__((target("neon"))) poly8x16_t vdupq_n_p8(poly8_t __p0) {
   9275   poly8x16_t __ret;
   9276   __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9277   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9278   return __ret;
   9279 }
   9280 #endif
   9281 
   9282 #ifdef __LITTLE_ENDIAN__
   9283 __ai __attribute__((target("neon"))) poly16x8_t vdupq_n_p16(poly16_t __p0) {
   9284   poly16x8_t __ret;
   9285   __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9286   return __ret;
   9287 }
   9288 #else
   9289 __ai __attribute__((target("neon"))) poly16x8_t vdupq_n_p16(poly16_t __p0) {
   9290   poly16x8_t __ret;
   9291   __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9292   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9293   return __ret;
   9294 }
   9295 #endif
   9296 
   9297 #ifdef __LITTLE_ENDIAN__
   9298 __ai __attribute__((target("neon"))) uint8x16_t vdupq_n_u8(uint8_t __p0) {
   9299   uint8x16_t __ret;
   9300   __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9301   return __ret;
   9302 }
   9303 #else
   9304 __ai __attribute__((target("neon"))) uint8x16_t vdupq_n_u8(uint8_t __p0) {
   9305   uint8x16_t __ret;
   9306   __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9307   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9308   return __ret;
   9309 }
   9310 #endif
   9311 
   9312 #ifdef __LITTLE_ENDIAN__
   9313 __ai __attribute__((target("neon"))) uint32x4_t vdupq_n_u32(uint32_t __p0) {
   9314   uint32x4_t __ret;
   9315   __ret = (uint32x4_t) {__p0, __p0, __p0, __p0};
   9316   return __ret;
   9317 }
   9318 #else
   9319 __ai __attribute__((target("neon"))) uint32x4_t vdupq_n_u32(uint32_t __p0) {
   9320   uint32x4_t __ret;
   9321   __ret = (uint32x4_t) {__p0, __p0, __p0, __p0};
   9322   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9323   return __ret;
   9324 }
   9325 #endif
   9326 
   9327 #ifdef __LITTLE_ENDIAN__
   9328 __ai __attribute__((target("neon"))) uint64x2_t vdupq_n_u64(uint64_t __p0) {
   9329   uint64x2_t __ret;
   9330   __ret = (uint64x2_t) {__p0, __p0};
   9331   return __ret;
   9332 }
   9333 #else
   9334 __ai __attribute__((target("neon"))) uint64x2_t vdupq_n_u64(uint64_t __p0) {
   9335   uint64x2_t __ret;
   9336   __ret = (uint64x2_t) {__p0, __p0};
   9337   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9338   return __ret;
   9339 }
   9340 #endif
   9341 
   9342 #ifdef __LITTLE_ENDIAN__
   9343 __ai __attribute__((target("neon"))) uint16x8_t vdupq_n_u16(uint16_t __p0) {
   9344   uint16x8_t __ret;
   9345   __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9346   return __ret;
   9347 }
   9348 #else
   9349 __ai __attribute__((target("neon"))) uint16x8_t vdupq_n_u16(uint16_t __p0) {
   9350   uint16x8_t __ret;
   9351   __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9352   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9353   return __ret;
   9354 }
   9355 #endif
   9356 
   9357 #ifdef __LITTLE_ENDIAN__
   9358 __ai __attribute__((target("neon"))) int8x16_t vdupq_n_s8(int8_t __p0) {
   9359   int8x16_t __ret;
   9360   __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9361   return __ret;
   9362 }
   9363 #else
   9364 __ai __attribute__((target("neon"))) int8x16_t vdupq_n_s8(int8_t __p0) {
   9365   int8x16_t __ret;
   9366   __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9367   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9368   return __ret;
   9369 }
   9370 #endif
   9371 
   9372 #ifdef __LITTLE_ENDIAN__
   9373 __ai __attribute__((target("neon"))) float32x4_t vdupq_n_f32(float32_t __p0) {
   9374   float32x4_t __ret;
   9375   __ret = (float32x4_t) {__p0, __p0, __p0, __p0};
   9376   return __ret;
   9377 }
   9378 #else
   9379 __ai __attribute__((target("neon"))) float32x4_t vdupq_n_f32(float32_t __p0) {
   9380   float32x4_t __ret;
   9381   __ret = (float32x4_t) {__p0, __p0, __p0, __p0};
   9382   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9383   return __ret;
   9384 }
   9385 #endif
   9386 
   9387 #ifdef __LITTLE_ENDIAN__
   9388 #define vdupq_n_f16(__p0) __extension__ ({ \
   9389   float16x8_t __ret; \
   9390   float16_t __s0 = __p0; \
   9391   __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \
   9392   __ret; \
   9393 })
   9394 #else
   9395 #define vdupq_n_f16(__p0) __extension__ ({ \
   9396   float16x8_t __ret; \
   9397   float16_t __s0 = __p0; \
   9398   __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \
   9399   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   9400   __ret; \
   9401 })
   9402 #endif
   9403 
   9404 #ifdef __LITTLE_ENDIAN__
   9405 __ai __attribute__((target("neon"))) int32x4_t vdupq_n_s32(int32_t __p0) {
   9406   int32x4_t __ret;
   9407   __ret = (int32x4_t) {__p0, __p0, __p0, __p0};
   9408   return __ret;
   9409 }
   9410 #else
   9411 __ai __attribute__((target("neon"))) int32x4_t vdupq_n_s32(int32_t __p0) {
   9412   int32x4_t __ret;
   9413   __ret = (int32x4_t) {__p0, __p0, __p0, __p0};
   9414   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9415   return __ret;
   9416 }
   9417 #endif
   9418 
   9419 #ifdef __LITTLE_ENDIAN__
   9420 __ai __attribute__((target("neon"))) int64x2_t vdupq_n_s64(int64_t __p0) {
   9421   int64x2_t __ret;
   9422   __ret = (int64x2_t) {__p0, __p0};
   9423   return __ret;
   9424 }
   9425 #else
   9426 __ai __attribute__((target("neon"))) int64x2_t vdupq_n_s64(int64_t __p0) {
   9427   int64x2_t __ret;
   9428   __ret = (int64x2_t) {__p0, __p0};
   9429   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9430   return __ret;
   9431 }
   9432 #endif
   9433 
   9434 #ifdef __LITTLE_ENDIAN__
   9435 __ai __attribute__((target("neon"))) int16x8_t vdupq_n_s16(int16_t __p0) {
   9436   int16x8_t __ret;
   9437   __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9438   return __ret;
   9439 }
   9440 #else
   9441 __ai __attribute__((target("neon"))) int16x8_t vdupq_n_s16(int16_t __p0) {
   9442   int16x8_t __ret;
   9443   __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9444   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9445   return __ret;
   9446 }
   9447 #endif
   9448 
   9449 #ifdef __LITTLE_ENDIAN__
   9450 __ai __attribute__((target("neon"))) uint8x8_t vdup_n_u8(uint8_t __p0) {
   9451   uint8x8_t __ret;
   9452   __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9453   return __ret;
   9454 }
   9455 #else
   9456 __ai __attribute__((target("neon"))) uint8x8_t vdup_n_u8(uint8_t __p0) {
   9457   uint8x8_t __ret;
   9458   __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9459   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9460   return __ret;
   9461 }
   9462 #endif
   9463 
   9464 #ifdef __LITTLE_ENDIAN__
   9465 __ai __attribute__((target("neon"))) uint32x2_t vdup_n_u32(uint32_t __p0) {
   9466   uint32x2_t __ret;
   9467   __ret = (uint32x2_t) {__p0, __p0};
   9468   return __ret;
   9469 }
   9470 #else
   9471 __ai __attribute__((target("neon"))) uint32x2_t vdup_n_u32(uint32_t __p0) {
   9472   uint32x2_t __ret;
   9473   __ret = (uint32x2_t) {__p0, __p0};
   9474   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9475   return __ret;
   9476 }
   9477 #endif
   9478 
   9479 __ai __attribute__((target("neon"))) uint64x1_t vdup_n_u64(uint64_t __p0) {
   9480   uint64x1_t __ret;
   9481   __ret = (uint64x1_t) {__p0};
   9482   return __ret;
   9483 }
   9484 #ifdef __LITTLE_ENDIAN__
   9485 __ai __attribute__((target("neon"))) uint16x4_t vdup_n_u16(uint16_t __p0) {
   9486   uint16x4_t __ret;
   9487   __ret = (uint16x4_t) {__p0, __p0, __p0, __p0};
   9488   return __ret;
   9489 }
   9490 #else
   9491 __ai __attribute__((target("neon"))) uint16x4_t vdup_n_u16(uint16_t __p0) {
   9492   uint16x4_t __ret;
   9493   __ret = (uint16x4_t) {__p0, __p0, __p0, __p0};
   9494   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9495   return __ret;
   9496 }
   9497 #endif
   9498 
   9499 #ifdef __LITTLE_ENDIAN__
   9500 __ai __attribute__((target("neon"))) int8x8_t vdup_n_s8(int8_t __p0) {
   9501   int8x8_t __ret;
   9502   __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9503   return __ret;
   9504 }
   9505 #else
   9506 __ai __attribute__((target("neon"))) int8x8_t vdup_n_s8(int8_t __p0) {
   9507   int8x8_t __ret;
   9508   __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
   9509   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9510   return __ret;
   9511 }
   9512 #endif
   9513 
   9514 #ifdef __LITTLE_ENDIAN__
   9515 __ai __attribute__((target("neon"))) float32x2_t vdup_n_f32(float32_t __p0) {
   9516   float32x2_t __ret;
   9517   __ret = (float32x2_t) {__p0, __p0};
   9518   return __ret;
   9519 }
   9520 #else
   9521 __ai __attribute__((target("neon"))) float32x2_t vdup_n_f32(float32_t __p0) {
   9522   float32x2_t __ret;
   9523   __ret = (float32x2_t) {__p0, __p0};
   9524   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9525   return __ret;
   9526 }
   9527 #endif
   9528 
   9529 #ifdef __LITTLE_ENDIAN__
   9530 #define vdup_n_f16(__p0) __extension__ ({ \
   9531   float16x4_t __ret; \
   9532   float16_t __s0 = __p0; \
   9533   __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \
   9534   __ret; \
   9535 })
   9536 #else
   9537 #define vdup_n_f16(__p0) __extension__ ({ \
   9538   float16x4_t __ret; \
   9539   float16_t __s0 = __p0; \
   9540   __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \
   9541   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   9542   __ret; \
   9543 })
   9544 #endif
   9545 
   9546 #ifdef __LITTLE_ENDIAN__
   9547 __ai __attribute__((target("neon"))) int32x2_t vdup_n_s32(int32_t __p0) {
   9548   int32x2_t __ret;
   9549   __ret = (int32x2_t) {__p0, __p0};
   9550   return __ret;
   9551 }
   9552 #else
   9553 __ai __attribute__((target("neon"))) int32x2_t vdup_n_s32(int32_t __p0) {
   9554   int32x2_t __ret;
   9555   __ret = (int32x2_t) {__p0, __p0};
   9556   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9557   return __ret;
   9558 }
   9559 #endif
   9560 
   9561 __ai __attribute__((target("neon"))) int64x1_t vdup_n_s64(int64_t __p0) {
   9562   int64x1_t __ret;
   9563   __ret = (int64x1_t) {__p0};
   9564   return __ret;
   9565 }
   9566 #ifdef __LITTLE_ENDIAN__
   9567 __ai __attribute__((target("neon"))) int16x4_t vdup_n_s16(int16_t __p0) {
   9568   int16x4_t __ret;
   9569   __ret = (int16x4_t) {__p0, __p0, __p0, __p0};
   9570   return __ret;
   9571 }
   9572 #else
   9573 __ai __attribute__((target("neon"))) int16x4_t vdup_n_s16(int16_t __p0) {
   9574   int16x4_t __ret;
   9575   __ret = (int16x4_t) {__p0, __p0, __p0, __p0};
   9576   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9577   return __ret;
   9578 }
   9579 #endif
   9580 
   9581 #ifdef __LITTLE_ENDIAN__
   9582 __ai __attribute__((target("neon"))) uint8x16_t veorq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   9583   uint8x16_t __ret;
   9584   __ret = __p0 ^ __p1;
   9585   return __ret;
   9586 }
   9587 #else
   9588 __ai __attribute__((target("neon"))) uint8x16_t veorq_u8(uint8x16_t __p0, uint8x16_t __p1) {
   9589   uint8x16_t __ret;
   9590   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9591   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9592   __ret = __rev0 ^ __rev1;
   9593   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9594   return __ret;
   9595 }
   9596 #endif
   9597 
   9598 #ifdef __LITTLE_ENDIAN__
   9599 __ai __attribute__((target("neon"))) uint32x4_t veorq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   9600   uint32x4_t __ret;
   9601   __ret = __p0 ^ __p1;
   9602   return __ret;
   9603 }
   9604 #else
   9605 __ai __attribute__((target("neon"))) uint32x4_t veorq_u32(uint32x4_t __p0, uint32x4_t __p1) {
   9606   uint32x4_t __ret;
   9607   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   9608   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   9609   __ret = __rev0 ^ __rev1;
   9610   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9611   return __ret;
   9612 }
   9613 #endif
   9614 
   9615 #ifdef __LITTLE_ENDIAN__
   9616 __ai __attribute__((target("neon"))) uint64x2_t veorq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   9617   uint64x2_t __ret;
   9618   __ret = __p0 ^ __p1;
   9619   return __ret;
   9620 }
   9621 #else
   9622 __ai __attribute__((target("neon"))) uint64x2_t veorq_u64(uint64x2_t __p0, uint64x2_t __p1) {
   9623   uint64x2_t __ret;
   9624   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   9625   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   9626   __ret = __rev0 ^ __rev1;
   9627   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9628   return __ret;
   9629 }
   9630 #endif
   9631 
   9632 #ifdef __LITTLE_ENDIAN__
   9633 __ai __attribute__((target("neon"))) uint16x8_t veorq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   9634   uint16x8_t __ret;
   9635   __ret = __p0 ^ __p1;
   9636   return __ret;
   9637 }
   9638 #else
   9639 __ai __attribute__((target("neon"))) uint16x8_t veorq_u16(uint16x8_t __p0, uint16x8_t __p1) {
   9640   uint16x8_t __ret;
   9641   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   9642   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   9643   __ret = __rev0 ^ __rev1;
   9644   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9645   return __ret;
   9646 }
   9647 #endif
   9648 
   9649 #ifdef __LITTLE_ENDIAN__
   9650 __ai __attribute__((target("neon"))) int8x16_t veorq_s8(int8x16_t __p0, int8x16_t __p1) {
   9651   int8x16_t __ret;
   9652   __ret = __p0 ^ __p1;
   9653   return __ret;
   9654 }
   9655 #else
   9656 __ai __attribute__((target("neon"))) int8x16_t veorq_s8(int8x16_t __p0, int8x16_t __p1) {
   9657   int8x16_t __ret;
   9658   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9659   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9660   __ret = __rev0 ^ __rev1;
   9661   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
   9662   return __ret;
   9663 }
   9664 #endif
   9665 
   9666 #ifdef __LITTLE_ENDIAN__
   9667 __ai __attribute__((target("neon"))) int32x4_t veorq_s32(int32x4_t __p0, int32x4_t __p1) {
   9668   int32x4_t __ret;
   9669   __ret = __p0 ^ __p1;
   9670   return __ret;
   9671 }
   9672 #else
   9673 __ai __attribute__((target("neon"))) int32x4_t veorq_s32(int32x4_t __p0, int32x4_t __p1) {
   9674   int32x4_t __ret;
   9675   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   9676   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   9677   __ret = __rev0 ^ __rev1;
   9678   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9679   return __ret;
   9680 }
   9681 #endif
   9682 
   9683 #ifdef __LITTLE_ENDIAN__
   9684 __ai __attribute__((target("neon"))) int64x2_t veorq_s64(int64x2_t __p0, int64x2_t __p1) {
   9685   int64x2_t __ret;
   9686   __ret = __p0 ^ __p1;
   9687   return __ret;
   9688 }
   9689 #else
   9690 __ai __attribute__((target("neon"))) int64x2_t veorq_s64(int64x2_t __p0, int64x2_t __p1) {
   9691   int64x2_t __ret;
   9692   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   9693   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   9694   __ret = __rev0 ^ __rev1;
   9695   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9696   return __ret;
   9697 }
   9698 #endif
   9699 
   9700 #ifdef __LITTLE_ENDIAN__
   9701 __ai __attribute__((target("neon"))) int16x8_t veorq_s16(int16x8_t __p0, int16x8_t __p1) {
   9702   int16x8_t __ret;
   9703   __ret = __p0 ^ __p1;
   9704   return __ret;
   9705 }
   9706 #else
   9707 __ai __attribute__((target("neon"))) int16x8_t veorq_s16(int16x8_t __p0, int16x8_t __p1) {
   9708   int16x8_t __ret;
   9709   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   9710   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   9711   __ret = __rev0 ^ __rev1;
   9712   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9713   return __ret;
   9714 }
   9715 #endif
   9716 
   9717 #ifdef __LITTLE_ENDIAN__
   9718 __ai __attribute__((target("neon"))) uint8x8_t veor_u8(uint8x8_t __p0, uint8x8_t __p1) {
   9719   uint8x8_t __ret;
   9720   __ret = __p0 ^ __p1;
   9721   return __ret;
   9722 }
   9723 #else
   9724 __ai __attribute__((target("neon"))) uint8x8_t veor_u8(uint8x8_t __p0, uint8x8_t __p1) {
   9725   uint8x8_t __ret;
   9726   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   9727   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   9728   __ret = __rev0 ^ __rev1;
   9729   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9730   return __ret;
   9731 }
   9732 #endif
   9733 
   9734 #ifdef __LITTLE_ENDIAN__
   9735 __ai __attribute__((target("neon"))) uint32x2_t veor_u32(uint32x2_t __p0, uint32x2_t __p1) {
   9736   uint32x2_t __ret;
   9737   __ret = __p0 ^ __p1;
   9738   return __ret;
   9739 }
   9740 #else
   9741 __ai __attribute__((target("neon"))) uint32x2_t veor_u32(uint32x2_t __p0, uint32x2_t __p1) {
   9742   uint32x2_t __ret;
   9743   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   9744   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   9745   __ret = __rev0 ^ __rev1;
   9746   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9747   return __ret;
   9748 }
   9749 #endif
   9750 
   9751 __ai __attribute__((target("neon"))) uint64x1_t veor_u64(uint64x1_t __p0, uint64x1_t __p1) {
   9752   uint64x1_t __ret;
   9753   __ret = __p0 ^ __p1;
   9754   return __ret;
   9755 }
   9756 #ifdef __LITTLE_ENDIAN__
   9757 __ai __attribute__((target("neon"))) uint16x4_t veor_u16(uint16x4_t __p0, uint16x4_t __p1) {
   9758   uint16x4_t __ret;
   9759   __ret = __p0 ^ __p1;
   9760   return __ret;
   9761 }
   9762 #else
   9763 __ai __attribute__((target("neon"))) uint16x4_t veor_u16(uint16x4_t __p0, uint16x4_t __p1) {
   9764   uint16x4_t __ret;
   9765   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   9766   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   9767   __ret = __rev0 ^ __rev1;
   9768   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9769   return __ret;
   9770 }
   9771 #endif
   9772 
   9773 #ifdef __LITTLE_ENDIAN__
   9774 __ai __attribute__((target("neon"))) int8x8_t veor_s8(int8x8_t __p0, int8x8_t __p1) {
   9775   int8x8_t __ret;
   9776   __ret = __p0 ^ __p1;
   9777   return __ret;
   9778 }
   9779 #else
   9780 __ai __attribute__((target("neon"))) int8x8_t veor_s8(int8x8_t __p0, int8x8_t __p1) {
   9781   int8x8_t __ret;
   9782   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
   9783   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
   9784   __ret = __rev0 ^ __rev1;
   9785   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
   9786   return __ret;
   9787 }
   9788 #endif
   9789 
   9790 #ifdef __LITTLE_ENDIAN__
   9791 __ai __attribute__((target("neon"))) int32x2_t veor_s32(int32x2_t __p0, int32x2_t __p1) {
   9792   int32x2_t __ret;
   9793   __ret = __p0 ^ __p1;
   9794   return __ret;
   9795 }
   9796 #else
   9797 __ai __attribute__((target("neon"))) int32x2_t veor_s32(int32x2_t __p0, int32x2_t __p1) {
   9798   int32x2_t __ret;
   9799   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
   9800   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
   9801   __ret = __rev0 ^ __rev1;
   9802   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
   9803   return __ret;
   9804 }
   9805 #endif
   9806 
   9807 __ai __attribute__((target("neon"))) int64x1_t veor_s64(int64x1_t __p0, int64x1_t __p1) {
   9808   int64x1_t __ret;
   9809   __ret = __p0 ^ __p1;
   9810   return __ret;
   9811 }
   9812 #ifdef __LITTLE_ENDIAN__
   9813 __ai __attribute__((target("neon"))) int16x4_t veor_s16(int16x4_t __p0, int16x4_t __p1) {
   9814   int16x4_t __ret;
   9815   __ret = __p0 ^ __p1;
   9816   return __ret;
   9817 }
   9818 #else
   9819 __ai __attribute__((target("neon"))) int16x4_t veor_s16(int16x4_t __p0, int16x4_t __p1) {
   9820   int16x4_t __ret;
   9821   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
   9822   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
   9823   __ret = __rev0 ^ __rev1;
   9824   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
   9825   return __ret;
   9826 }
   9827 #endif
   9828 
   9829 #ifdef __LITTLE_ENDIAN__
   9830 #define vext_p8(__p0, __p1, __p2) __extension__ ({ \
   9831   poly8x8_t __ret; \
   9832   poly8x8_t __s0 = __p0; \
   9833   poly8x8_t __s1 = __p1; \
   9834   __ret = (poly8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \
   9835   __ret; \
   9836 })
   9837 #else
   9838 #define vext_p8(__p0, __p1, __p2) __extension__ ({ \
   9839   poly8x8_t __ret; \
   9840   poly8x8_t __s0 = __p0; \
   9841   poly8x8_t __s1 = __p1; \
   9842   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   9843   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
   9844   __ret = (poly8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \
   9845   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   9846   __ret; \
   9847 })
   9848 #endif
   9849 
   9850 #ifdef __LITTLE_ENDIAN__
   9851 #define vext_p16(__p0, __p1, __p2) __extension__ ({ \
   9852   poly16x4_t __ret; \
   9853   poly16x4_t __s0 = __p0; \
   9854   poly16x4_t __s1 = __p1; \
   9855   __ret = (poly16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \
   9856   __ret; \
   9857 })
   9858 #else
   9859 #define vext_p16(__p0, __p1, __p2) __extension__ ({ \
   9860   poly16x4_t __ret; \
   9861   poly16x4_t __s0 = __p0; \
   9862   poly16x4_t __s1 = __p1; \
   9863   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   9864   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
   9865   __ret = (poly16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 5); \
   9866   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   9867   __ret; \
   9868 })
   9869 #endif
   9870 
   9871 #ifdef __LITTLE_ENDIAN__
   9872 #define vextq_p8(__p0, __p1, __p2) __extension__ ({ \
   9873   poly8x16_t __ret; \
   9874   poly8x16_t __s0 = __p0; \
   9875   poly8x16_t __s1 = __p1; \
   9876   __ret = (poly8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \
   9877   __ret; \
   9878 })
   9879 #else
   9880 #define vextq_p8(__p0, __p1, __p2) __extension__ ({ \
   9881   poly8x16_t __ret; \
   9882   poly8x16_t __s0 = __p0; \
   9883   poly8x16_t __s1 = __p1; \
   9884   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9885   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9886   __ret = (poly8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
   9887   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9888   __ret; \
   9889 })
   9890 #endif
   9891 
   9892 #ifdef __LITTLE_ENDIAN__
   9893 #define vextq_p16(__p0, __p1, __p2) __extension__ ({ \
   9894   poly16x8_t __ret; \
   9895   poly16x8_t __s0 = __p0; \
   9896   poly16x8_t __s1 = __p1; \
   9897   __ret = (poly16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \
   9898   __ret; \
   9899 })
   9900 #else
   9901 #define vextq_p16(__p0, __p1, __p2) __extension__ ({ \
   9902   poly16x8_t __ret; \
   9903   poly16x8_t __s0 = __p0; \
   9904   poly16x8_t __s1 = __p1; \
   9905   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   9906   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
   9907   __ret = (poly16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \
   9908   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   9909   __ret; \
   9910 })
   9911 #endif
   9912 
   9913 #ifdef __LITTLE_ENDIAN__
   9914 #define vextq_u8(__p0, __p1, __p2) __extension__ ({ \
   9915   uint8x16_t __ret; \
   9916   uint8x16_t __s0 = __p0; \
   9917   uint8x16_t __s1 = __p1; \
   9918   __ret = (uint8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
   9919   __ret; \
   9920 })
   9921 #else
   9922 #define vextq_u8(__p0, __p1, __p2) __extension__ ({ \
   9923   uint8x16_t __ret; \
   9924   uint8x16_t __s0 = __p0; \
   9925   uint8x16_t __s1 = __p1; \
   9926   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9927   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9928   __ret = (uint8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
   9929   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
   9930   __ret; \
   9931 })
   9932 #endif
   9933 
   9934 #ifdef __LITTLE_ENDIAN__
   9935 #define vextq_u32(__p0, __p1, __p2) __extension__ ({ \
   9936   uint32x4_t __ret; \
   9937   uint32x4_t __s0 = __p0; \
   9938   uint32x4_t __s1 = __p1; \
   9939   __ret = (uint32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \
   9940   __ret; \
   9941 })
   9942 #else
   9943 #define vextq_u32(__p0, __p1, __p2) __extension__ ({ \
   9944   uint32x4_t __ret; \
   9945   uint32x4_t __s0 = __p0; \
   9946   uint32x4_t __s1 = __p1; \
   9947   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
   9948   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
   9949   __ret = (uint32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \
   9950   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
   9951   __ret; \
   9952 })
   9953 #endif
   9954 
   9955 #ifdef __LITTLE_ENDIAN__
   9956 #define vextq_u64(__p0, __p1, __p2) __extension__ ({ \
   9957   uint64x2_t __ret; \
   9958   uint64x2_t __s0 = __p0; \
   9959   uint64x2_t __s1 = __p1; \
   9960   __ret = (uint64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
   9961   __ret; \
   9962 })
   9963 #else
   9964 #define vextq_u64(__p0, __p1, __p2) __extension__ ({ \
   9965   uint64x2_t __ret; \
   9966   uint64x2_t __s0 = __p0; \
   9967   uint64x2_t __s1 = __p1; \
   9968   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
   9969   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
   9970   __ret = (uint64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
   9971   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
   9972   __ret; \
   9973 })
   9974 #endif
   9975 
   9976 #ifdef __LITTLE_ENDIAN__
   9977 #define vextq_u16(__p0, __p1, __p2) __extension__ ({ \
   9978   uint16x8_t __ret; \
   9979   uint16x8_t __s0 = __p0; \
   9980   uint16x8_t __s1 = __p1; \
   9981   __ret = (uint16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \
   9982   __ret; \
   9983 })
   9984 #else
   9985 #define vextq_u16(__p0, __p1, __p2) __extension__ ({ \
   9986   uint16x8_t __ret; \
   9987   uint16x8_t __s0 = __p0; \
   9988   uint16x8_t __s1 = __p1; \
   9989   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
   9990   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
   9991   __ret = (uint16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
   9992   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
   9993   __ret; \
   9994 })
   9995 #endif
   9996 
   9997 #ifdef __LITTLE_ENDIAN__
   9998 #define vextq_s8(__p0, __p1, __p2) __extension__ ({ \
   9999   int8x16_t __ret; \
  10000   int8x16_t __s0 = __p0; \
  10001   int8x16_t __s1 = __p1; \
  10002   __ret = (int8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  10003   __ret; \
  10004 })
  10005 #else
  10006 #define vextq_s8(__p0, __p1, __p2) __extension__ ({ \
  10007   int8x16_t __ret; \
  10008   int8x16_t __s0 = __p0; \
  10009   int8x16_t __s1 = __p1; \
  10010   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10011   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10012   __ret = (int8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  10013   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10014   __ret; \
  10015 })
  10016 #endif
  10017 
  10018 #ifdef __LITTLE_ENDIAN__
  10019 #define vextq_f32(__p0, __p1, __p2) __extension__ ({ \
  10020   float32x4_t __ret; \
  10021   float32x4_t __s0 = __p0; \
  10022   float32x4_t __s1 = __p1; \
  10023   __ret = (float32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 41); \
  10024   __ret; \
  10025 })
  10026 #else
  10027 #define vextq_f32(__p0, __p1, __p2) __extension__ ({ \
  10028   float32x4_t __ret; \
  10029   float32x4_t __s0 = __p0; \
  10030   float32x4_t __s1 = __p1; \
  10031   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10032   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  10033   __ret = (float32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 41); \
  10034   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  10035   __ret; \
  10036 })
  10037 #endif
  10038 
  10039 #ifdef __LITTLE_ENDIAN__
  10040 #define vextq_s32(__p0, __p1, __p2) __extension__ ({ \
  10041   int32x4_t __ret; \
  10042   int32x4_t __s0 = __p0; \
  10043   int32x4_t __s1 = __p1; \
  10044   __ret = (int32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  10045   __ret; \
  10046 })
  10047 #else
  10048 #define vextq_s32(__p0, __p1, __p2) __extension__ ({ \
  10049   int32x4_t __ret; \
  10050   int32x4_t __s0 = __p0; \
  10051   int32x4_t __s1 = __p1; \
  10052   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10053   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  10054   __ret = (int32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
  10055   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  10056   __ret; \
  10057 })
  10058 #endif
  10059 
  10060 #ifdef __LITTLE_ENDIAN__
  10061 #define vextq_s64(__p0, __p1, __p2) __extension__ ({ \
  10062   int64x2_t __ret; \
  10063   int64x2_t __s0 = __p0; \
  10064   int64x2_t __s1 = __p1; \
  10065   __ret = (int64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \
  10066   __ret; \
  10067 })
  10068 #else
  10069 #define vextq_s64(__p0, __p1, __p2) __extension__ ({ \
  10070   int64x2_t __ret; \
  10071   int64x2_t __s0 = __p0; \
  10072   int64x2_t __s1 = __p1; \
  10073   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10074   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  10075   __ret = (int64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \
  10076   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  10077   __ret; \
  10078 })
  10079 #endif
  10080 
  10081 #ifdef __LITTLE_ENDIAN__
  10082 #define vextq_s16(__p0, __p1, __p2) __extension__ ({ \
  10083   int16x8_t __ret; \
  10084   int16x8_t __s0 = __p0; \
  10085   int16x8_t __s1 = __p1; \
  10086   __ret = (int16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  10087   __ret; \
  10088 })
  10089 #else
  10090 #define vextq_s16(__p0, __p1, __p2) __extension__ ({ \
  10091   int16x8_t __ret; \
  10092   int16x8_t __s0 = __p0; \
  10093   int16x8_t __s1 = __p1; \
  10094   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10095   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  10096   __ret = (int16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  10097   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  10098   __ret; \
  10099 })
  10100 #endif
  10101 
  10102 #ifdef __LITTLE_ENDIAN__
  10103 #define vext_u8(__p0, __p1, __p2) __extension__ ({ \
  10104   uint8x8_t __ret; \
  10105   uint8x8_t __s0 = __p0; \
  10106   uint8x8_t __s1 = __p1; \
  10107   __ret = (uint8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \
  10108   __ret; \
  10109 })
  10110 #else
  10111 #define vext_u8(__p0, __p1, __p2) __extension__ ({ \
  10112   uint8x8_t __ret; \
  10113   uint8x8_t __s0 = __p0; \
  10114   uint8x8_t __s1 = __p1; \
  10115   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10116   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  10117   __ret = (uint8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \
  10118   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  10119   __ret; \
  10120 })
  10121 #endif
  10122 
  10123 #ifdef __LITTLE_ENDIAN__
  10124 #define vext_u32(__p0, __p1, __p2) __extension__ ({ \
  10125   uint32x2_t __ret; \
  10126   uint32x2_t __s0 = __p0; \
  10127   uint32x2_t __s1 = __p1; \
  10128   __ret = (uint32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \
  10129   __ret; \
  10130 })
  10131 #else
  10132 #define vext_u32(__p0, __p1, __p2) __extension__ ({ \
  10133   uint32x2_t __ret; \
  10134   uint32x2_t __s0 = __p0; \
  10135   uint32x2_t __s1 = __p1; \
  10136   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10137   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  10138   __ret = (uint32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \
  10139   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  10140   __ret; \
  10141 })
  10142 #endif
  10143 
  10144 #define vext_u64(__p0, __p1, __p2) __extension__ ({ \
  10145   uint64x1_t __ret; \
  10146   uint64x1_t __s0 = __p0; \
  10147   uint64x1_t __s1 = __p1; \
  10148   __ret = (uint64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \
  10149   __ret; \
  10150 })
  10151 #ifdef __LITTLE_ENDIAN__
  10152 #define vext_u16(__p0, __p1, __p2) __extension__ ({ \
  10153   uint16x4_t __ret; \
  10154   uint16x4_t __s0 = __p0; \
  10155   uint16x4_t __s1 = __p1; \
  10156   __ret = (uint16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \
  10157   __ret; \
  10158 })
  10159 #else
  10160 #define vext_u16(__p0, __p1, __p2) __extension__ ({ \
  10161   uint16x4_t __ret; \
  10162   uint16x4_t __s0 = __p0; \
  10163   uint16x4_t __s1 = __p1; \
  10164   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10165   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  10166   __ret = (uint16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \
  10167   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  10168   __ret; \
  10169 })
  10170 #endif
  10171 
  10172 #ifdef __LITTLE_ENDIAN__
  10173 #define vext_s8(__p0, __p1, __p2) __extension__ ({ \
  10174   int8x8_t __ret; \
  10175   int8x8_t __s0 = __p0; \
  10176   int8x8_t __s1 = __p1; \
  10177   __ret = (int8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \
  10178   __ret; \
  10179 })
  10180 #else
  10181 #define vext_s8(__p0, __p1, __p2) __extension__ ({ \
  10182   int8x8_t __ret; \
  10183   int8x8_t __s0 = __p0; \
  10184   int8x8_t __s1 = __p1; \
  10185   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10186   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  10187   __ret = (int8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \
  10188   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  10189   __ret; \
  10190 })
  10191 #endif
  10192 
  10193 #ifdef __LITTLE_ENDIAN__
  10194 #define vext_f32(__p0, __p1, __p2) __extension__ ({ \
  10195   float32x2_t __ret; \
  10196   float32x2_t __s0 = __p0; \
  10197   float32x2_t __s1 = __p1; \
  10198   __ret = (float32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 9); \
  10199   __ret; \
  10200 })
  10201 #else
  10202 #define vext_f32(__p0, __p1, __p2) __extension__ ({ \
  10203   float32x2_t __ret; \
  10204   float32x2_t __s0 = __p0; \
  10205   float32x2_t __s1 = __p1; \
  10206   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10207   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  10208   __ret = (float32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 9); \
  10209   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  10210   __ret; \
  10211 })
  10212 #endif
  10213 
  10214 #ifdef __LITTLE_ENDIAN__
  10215 #define vext_s32(__p0, __p1, __p2) __extension__ ({ \
  10216   int32x2_t __ret; \
  10217   int32x2_t __s0 = __p0; \
  10218   int32x2_t __s1 = __p1; \
  10219   __ret = (int32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  10220   __ret; \
  10221 })
  10222 #else
  10223 #define vext_s32(__p0, __p1, __p2) __extension__ ({ \
  10224   int32x2_t __ret; \
  10225   int32x2_t __s0 = __p0; \
  10226   int32x2_t __s1 = __p1; \
  10227   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10228   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  10229   __ret = (int32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  10230   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  10231   __ret; \
  10232 })
  10233 #endif
  10234 
  10235 #define vext_s64(__p0, __p1, __p2) __extension__ ({ \
  10236   int64x1_t __ret; \
  10237   int64x1_t __s0 = __p0; \
  10238   int64x1_t __s1 = __p1; \
  10239   __ret = (int64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \
  10240   __ret; \
  10241 })
  10242 #ifdef __LITTLE_ENDIAN__
  10243 #define vext_s16(__p0, __p1, __p2) __extension__ ({ \
  10244   int16x4_t __ret; \
  10245   int16x4_t __s0 = __p0; \
  10246   int16x4_t __s1 = __p1; \
  10247   __ret = (int16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  10248   __ret; \
  10249 })
  10250 #else
  10251 #define vext_s16(__p0, __p1, __p2) __extension__ ({ \
  10252   int16x4_t __ret; \
  10253   int16x4_t __s0 = __p0; \
  10254   int16x4_t __s1 = __p1; \
  10255   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10256   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  10257   __ret = (int16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  10258   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  10259   __ret; \
  10260 })
  10261 #endif
  10262 
  10263 #ifdef __LITTLE_ENDIAN__
  10264 #define vextq_f16(__p0, __p1, __p2) __extension__ ({ \
  10265   float16x8_t __ret; \
  10266   float16x8_t __s0 = __p0; \
  10267   float16x8_t __s1 = __p1; \
  10268   __ret = (float16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 40); \
  10269   __ret; \
  10270 })
  10271 #else
  10272 #define vextq_f16(__p0, __p1, __p2) __extension__ ({ \
  10273   float16x8_t __ret; \
  10274   float16x8_t __s0 = __p0; \
  10275   float16x8_t __s1 = __p1; \
  10276   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10277   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  10278   __ret = (float16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 40); \
  10279   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  10280   __ret; \
  10281 })
  10282 #endif
  10283 
  10284 #ifdef __LITTLE_ENDIAN__
  10285 #define vext_f16(__p0, __p1, __p2) __extension__ ({ \
  10286   float16x4_t __ret; \
  10287   float16x4_t __s0 = __p0; \
  10288   float16x4_t __s1 = __p1; \
  10289   __ret = (float16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 8); \
  10290   __ret; \
  10291 })
  10292 #else
  10293 #define vext_f16(__p0, __p1, __p2) __extension__ ({ \
  10294   float16x4_t __ret; \
  10295   float16x4_t __s0 = __p0; \
  10296   float16x4_t __s1 = __p1; \
  10297   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10298   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  10299   __ret = (float16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 8); \
  10300   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  10301   __ret; \
  10302 })
  10303 #endif
  10304 
  10305 #ifdef __LITTLE_ENDIAN__
  10306 __ai __attribute__((target("neon"))) poly8x8_t vget_high_p8(poly8x16_t __p0) {
  10307   poly8x8_t __ret;
  10308   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10309   return __ret;
  10310 }
  10311 #else
  10312 __ai __attribute__((target("neon"))) poly8x8_t vget_high_p8(poly8x16_t __p0) {
  10313   poly8x8_t __ret;
  10314   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  10315   __ret = __builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15);
  10316   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  10317   return __ret;
  10318 }
  10319 __ai __attribute__((target("neon"))) poly8x8_t __noswap_vget_high_p8(poly8x16_t __p0) {
  10320   poly8x8_t __ret;
  10321   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10322   return __ret;
  10323 }
  10324 #endif
  10325 
  10326 #ifdef __LITTLE_ENDIAN__
  10327 __ai __attribute__((target("neon"))) poly16x4_t vget_high_p16(poly16x8_t __p0) {
  10328   poly16x4_t __ret;
  10329   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10330   return __ret;
  10331 }
  10332 #else
  10333 __ai __attribute__((target("neon"))) poly16x4_t vget_high_p16(poly16x8_t __p0) {
  10334   poly16x4_t __ret;
  10335   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  10336   __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7);
  10337   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  10338   return __ret;
  10339 }
  10340 #endif
  10341 
  10342 #ifdef __LITTLE_ENDIAN__
  10343 __ai __attribute__((target("neon"))) uint8x8_t vget_high_u8(uint8x16_t __p0) {
  10344   uint8x8_t __ret;
  10345   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10346   return __ret;
  10347 }
  10348 #else
  10349 __ai __attribute__((target("neon"))) uint8x8_t vget_high_u8(uint8x16_t __p0) {
  10350   uint8x8_t __ret;
  10351   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  10352   __ret = __builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15);
  10353   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  10354   return __ret;
  10355 }
  10356 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vget_high_u8(uint8x16_t __p0) {
  10357   uint8x8_t __ret;
  10358   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10359   return __ret;
  10360 }
  10361 #endif
  10362 
  10363 #ifdef __LITTLE_ENDIAN__
  10364 __ai __attribute__((target("neon"))) uint32x2_t vget_high_u32(uint32x4_t __p0) {
  10365   uint32x2_t __ret;
  10366   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10367   return __ret;
  10368 }
  10369 #else
  10370 __ai __attribute__((target("neon"))) uint32x2_t vget_high_u32(uint32x4_t __p0) {
  10371   uint32x2_t __ret;
  10372   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  10373   __ret = __builtin_shufflevector(__rev0, __rev0, 2, 3);
  10374   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  10375   return __ret;
  10376 }
  10377 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vget_high_u32(uint32x4_t __p0) {
  10378   uint32x2_t __ret;
  10379   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10380   return __ret;
  10381 }
  10382 #endif
  10383 
  10384 #ifdef __LITTLE_ENDIAN__
  10385 __ai __attribute__((target("neon"))) uint64x1_t vget_high_u64(uint64x2_t __p0) {
  10386   uint64x1_t __ret;
  10387   __ret = __builtin_shufflevector(__p0, __p0, 1);
  10388   return __ret;
  10389 }
  10390 #else
  10391 __ai __attribute__((target("neon"))) uint64x1_t vget_high_u64(uint64x2_t __p0) {
  10392   uint64x1_t __ret;
  10393   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  10394   __ret = __builtin_shufflevector(__rev0, __rev0, 1);
  10395   return __ret;
  10396 }
  10397 #endif
  10398 
  10399 #ifdef __LITTLE_ENDIAN__
  10400 __ai __attribute__((target("neon"))) uint16x4_t vget_high_u16(uint16x8_t __p0) {
  10401   uint16x4_t __ret;
  10402   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10403   return __ret;
  10404 }
  10405 #else
  10406 __ai __attribute__((target("neon"))) uint16x4_t vget_high_u16(uint16x8_t __p0) {
  10407   uint16x4_t __ret;
  10408   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  10409   __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7);
  10410   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  10411   return __ret;
  10412 }
  10413 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vget_high_u16(uint16x8_t __p0) {
  10414   uint16x4_t __ret;
  10415   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10416   return __ret;
  10417 }
  10418 #endif
  10419 
  10420 #ifdef __LITTLE_ENDIAN__
  10421 __ai __attribute__((target("neon"))) int8x8_t vget_high_s8(int8x16_t __p0) {
  10422   int8x8_t __ret;
  10423   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10424   return __ret;
  10425 }
  10426 #else
  10427 __ai __attribute__((target("neon"))) int8x8_t vget_high_s8(int8x16_t __p0) {
  10428   int8x8_t __ret;
  10429   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  10430   __ret = __builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15);
  10431   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  10432   return __ret;
  10433 }
  10434 __ai __attribute__((target("neon"))) int8x8_t __noswap_vget_high_s8(int8x16_t __p0) {
  10435   int8x8_t __ret;
  10436   __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15);
  10437   return __ret;
  10438 }
  10439 #endif
  10440 
  10441 #ifdef __LITTLE_ENDIAN__
  10442 __ai __attribute__((target("neon"))) float32x2_t vget_high_f32(float32x4_t __p0) {
  10443   float32x2_t __ret;
  10444   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10445   return __ret;
  10446 }
  10447 #else
  10448 __ai __attribute__((target("neon"))) float32x2_t vget_high_f32(float32x4_t __p0) {
  10449   float32x2_t __ret;
  10450   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  10451   __ret = __builtin_shufflevector(__rev0, __rev0, 2, 3);
  10452   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  10453   return __ret;
  10454 }
  10455 __ai __attribute__((target("neon"))) float32x2_t __noswap_vget_high_f32(float32x4_t __p0) {
  10456   float32x2_t __ret;
  10457   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10458   return __ret;
  10459 }
  10460 #endif
  10461 
  10462 #ifdef __LITTLE_ENDIAN__
  10463 __ai __attribute__((target("neon"))) float16x4_t vget_high_f16(float16x8_t __p0) {
  10464   float16x4_t __ret;
  10465   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10466   return __ret;
  10467 }
  10468 #else
  10469 __ai __attribute__((target("neon"))) float16x4_t vget_high_f16(float16x8_t __p0) {
  10470   float16x4_t __ret;
  10471   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  10472   __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7);
  10473   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  10474   return __ret;
  10475 }
  10476 __ai __attribute__((target("neon"))) float16x4_t __noswap_vget_high_f16(float16x8_t __p0) {
  10477   float16x4_t __ret;
  10478   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10479   return __ret;
  10480 }
  10481 #endif
  10482 
  10483 #ifdef __LITTLE_ENDIAN__
  10484 __ai __attribute__((target("neon"))) int32x2_t vget_high_s32(int32x4_t __p0) {
  10485   int32x2_t __ret;
  10486   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10487   return __ret;
  10488 }
  10489 #else
  10490 __ai __attribute__((target("neon"))) int32x2_t vget_high_s32(int32x4_t __p0) {
  10491   int32x2_t __ret;
  10492   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  10493   __ret = __builtin_shufflevector(__rev0, __rev0, 2, 3);
  10494   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  10495   return __ret;
  10496 }
  10497 __ai __attribute__((target("neon"))) int32x2_t __noswap_vget_high_s32(int32x4_t __p0) {
  10498   int32x2_t __ret;
  10499   __ret = __builtin_shufflevector(__p0, __p0, 2, 3);
  10500   return __ret;
  10501 }
  10502 #endif
  10503 
  10504 #ifdef __LITTLE_ENDIAN__
  10505 __ai __attribute__((target("neon"))) int64x1_t vget_high_s64(int64x2_t __p0) {
  10506   int64x1_t __ret;
  10507   __ret = __builtin_shufflevector(__p0, __p0, 1);
  10508   return __ret;
  10509 }
  10510 #else
  10511 __ai __attribute__((target("neon"))) int64x1_t vget_high_s64(int64x2_t __p0) {
  10512   int64x1_t __ret;
  10513   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  10514   __ret = __builtin_shufflevector(__rev0, __rev0, 1);
  10515   return __ret;
  10516 }
  10517 #endif
  10518 
  10519 #ifdef __LITTLE_ENDIAN__
  10520 __ai __attribute__((target("neon"))) int16x4_t vget_high_s16(int16x8_t __p0) {
  10521   int16x4_t __ret;
  10522   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10523   return __ret;
  10524 }
  10525 #else
  10526 __ai __attribute__((target("neon"))) int16x4_t vget_high_s16(int16x8_t __p0) {
  10527   int16x4_t __ret;
  10528   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  10529   __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7);
  10530   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  10531   return __ret;
  10532 }
  10533 __ai __attribute__((target("neon"))) int16x4_t __noswap_vget_high_s16(int16x8_t __p0) {
  10534   int16x4_t __ret;
  10535   __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7);
  10536   return __ret;
  10537 }
  10538 #endif
  10539 
  10540 #ifdef __LITTLE_ENDIAN__
  10541 #define vget_lane_p8(__p0, __p1) __extension__ ({ \
  10542   poly8_t __ret; \
  10543   poly8x8_t __s0 = __p0; \
  10544   __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__s0, __p1); \
  10545   __ret; \
  10546 })
  10547 #else
  10548 #define vget_lane_p8(__p0, __p1) __extension__ ({ \
  10549   poly8_t __ret; \
  10550   poly8x8_t __s0 = __p0; \
  10551   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10552   __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__rev0, __p1); \
  10553   __ret; \
  10554 })
  10555 #define __noswap_vget_lane_p8(__p0, __p1) __extension__ ({ \
  10556   poly8_t __ret; \
  10557   poly8x8_t __s0 = __p0; \
  10558   __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__s0, __p1); \
  10559   __ret; \
  10560 })
  10561 #endif
  10562 
  10563 #ifdef __LITTLE_ENDIAN__
  10564 #define vget_lane_p16(__p0, __p1) __extension__ ({ \
  10565   poly16_t __ret; \
  10566   poly16x4_t __s0 = __p0; \
  10567   __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__s0, __p1); \
  10568   __ret; \
  10569 })
  10570 #else
  10571 #define vget_lane_p16(__p0, __p1) __extension__ ({ \
  10572   poly16_t __ret; \
  10573   poly16x4_t __s0 = __p0; \
  10574   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10575   __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__rev0, __p1); \
  10576   __ret; \
  10577 })
  10578 #define __noswap_vget_lane_p16(__p0, __p1) __extension__ ({ \
  10579   poly16_t __ret; \
  10580   poly16x4_t __s0 = __p0; \
  10581   __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__s0, __p1); \
  10582   __ret; \
  10583 })
  10584 #endif
  10585 
  10586 #ifdef __LITTLE_ENDIAN__
  10587 #define vgetq_lane_p8(__p0, __p1) __extension__ ({ \
  10588   poly8_t __ret; \
  10589   poly8x16_t __s0 = __p0; \
  10590   __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__s0, __p1); \
  10591   __ret; \
  10592 })
  10593 #else
  10594 #define vgetq_lane_p8(__p0, __p1) __extension__ ({ \
  10595   poly8_t __ret; \
  10596   poly8x16_t __s0 = __p0; \
  10597   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10598   __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__rev0, __p1); \
  10599   __ret; \
  10600 })
  10601 #define __noswap_vgetq_lane_p8(__p0, __p1) __extension__ ({ \
  10602   poly8_t __ret; \
  10603   poly8x16_t __s0 = __p0; \
  10604   __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__s0, __p1); \
  10605   __ret; \
  10606 })
  10607 #endif
  10608 
  10609 #ifdef __LITTLE_ENDIAN__
  10610 #define vgetq_lane_p16(__p0, __p1) __extension__ ({ \
  10611   poly16_t __ret; \
  10612   poly16x8_t __s0 = __p0; \
  10613   __ret = (poly16_t) __builtin_neon_vgetq_lane_i16((poly16x8_t)__s0, __p1); \
  10614   __ret; \
  10615 })
  10616 #else
  10617 #define vgetq_lane_p16(__p0, __p1) __extension__ ({ \
  10618   poly16_t __ret; \
  10619   poly16x8_t __s0 = __p0; \
  10620   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10621   __ret = (poly16_t) __builtin_neon_vgetq_lane_i16((poly16x8_t)__rev0, __p1); \
  10622   __ret; \
  10623 })
  10624 #define __noswap_vgetq_lane_p16(__p0, __p1) __extension__ ({ \
  10625   poly16_t __ret; \
  10626   poly16x8_t __s0 = __p0; \
  10627   __ret = (poly16_t) __builtin_neon_vgetq_lane_i16((poly16x8_t)__s0, __p1); \
  10628   __ret; \
  10629 })
  10630 #endif
  10631 
  10632 #ifdef __LITTLE_ENDIAN__
  10633 #define vgetq_lane_u8(__p0, __p1) __extension__ ({ \
  10634   uint8_t __ret; \
  10635   uint8x16_t __s0 = __p0; \
  10636   __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \
  10637   __ret; \
  10638 })
  10639 #else
  10640 #define vgetq_lane_u8(__p0, __p1) __extension__ ({ \
  10641   uint8_t __ret; \
  10642   uint8x16_t __s0 = __p0; \
  10643   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10644   __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__rev0, __p1); \
  10645   __ret; \
  10646 })
  10647 #define __noswap_vgetq_lane_u8(__p0, __p1) __extension__ ({ \
  10648   uint8_t __ret; \
  10649   uint8x16_t __s0 = __p0; \
  10650   __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \
  10651   __ret; \
  10652 })
  10653 #endif
  10654 
  10655 #ifdef __LITTLE_ENDIAN__
  10656 #define vgetq_lane_u32(__p0, __p1) __extension__ ({ \
  10657   uint32_t __ret; \
  10658   uint32x4_t __s0 = __p0; \
  10659   __ret = (uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \
  10660   __ret; \
  10661 })
  10662 #else
  10663 #define vgetq_lane_u32(__p0, __p1) __extension__ ({ \
  10664   uint32_t __ret; \
  10665   uint32x4_t __s0 = __p0; \
  10666   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10667   __ret = (uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__rev0, __p1); \
  10668   __ret; \
  10669 })
  10670 #define __noswap_vgetq_lane_u32(__p0, __p1) __extension__ ({ \
  10671   uint32_t __ret; \
  10672   uint32x4_t __s0 = __p0; \
  10673   __ret = (uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \
  10674   __ret; \
  10675 })
  10676 #endif
  10677 
  10678 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_u64(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a uint64x2_t temporary, which is cast to int64x2_t and handed with __p1 to
         * __builtin_neon_vgetq_lane_i64; the result is yielded as uint64_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10679 #define vgetq_lane_u64(__p0, __p1) __extension__ ({ \
  10680   uint64_t __ret; \
  10681   uint64x2_t __s0 = __p0; \
  10682   __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \
  10683   __ret; \
  10684 })
  10685 #else
        /* Big-endian build: the two lanes of the temporary are swapped with
         * __builtin_shufflevector (1, 0) before the builtin is called. */
  10686 #define vgetq_lane_u64(__p0, __p1) __extension__ ({ \
  10687   uint64_t __ret; \
  10688   uint64x2_t __s0 = __p0; \
  10689   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10690   __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__rev0, __p1); \
  10691   __ret; \
  10692 })
        /* __noswap_vgetq_lane_u64: defined only in this branch; same body as the
         * little-endian macro (no lane swap). NOTE(review): presumably meant for callers
         * whose vector is already lane-reversed - confirm at the call sites. */
  10693 #define __noswap_vgetq_lane_u64(__p0, __p1) __extension__ ({ \
  10694   uint64_t __ret; \
  10695   uint64x2_t __s0 = __p0; \
  10696   __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \
  10697   __ret; \
  10698 })
  10699 #endif
  10700 
  10701 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_u16(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a uint16x8_t temporary, which is cast to int16x8_t and handed with __p1 to
         * __builtin_neon_vgetq_lane_i16; the result is yielded as uint16_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10702 #define vgetq_lane_u16(__p0, __p1) __extension__ ({ \
  10703   uint16_t __ret; \
  10704   uint16x8_t __s0 = __p0; \
  10705   __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \
  10706   __ret; \
  10707 })
  10708 #else
        /* Big-endian build: the eight lanes of the temporary are reversed with
         * __builtin_shufflevector (7 .. 0) before the builtin is called. */
  10709 #define vgetq_lane_u16(__p0, __p1) __extension__ ({ \
  10710   uint16_t __ret; \
  10711   uint16x8_t __s0 = __p0; \
  10712   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10713   __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__rev0, __p1); \
  10714   __ret; \
  10715 })
        /* __noswap_vgetq_lane_u16: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10716 #define __noswap_vgetq_lane_u16(__p0, __p1) __extension__ ({ \
  10717   uint16_t __ret; \
  10718   uint16x8_t __s0 = __p0; \
  10719   __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \
  10720   __ret; \
  10721 })
  10722 #endif
  10723 
  10724 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_s8(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int8x16_t temporary, which is handed with __p1 to
         * __builtin_neon_vgetq_lane_i8; the result is yielded as int8_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10725 #define vgetq_lane_s8(__p0, __p1) __extension__ ({ \
  10726   int8_t __ret; \
  10727   int8x16_t __s0 = __p0; \
  10728   __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \
  10729   __ret; \
  10730 })
  10731 #else
        /* Big-endian build: the sixteen lanes of the temporary are reversed with
         * __builtin_shufflevector (15 .. 0) before the builtin is called. */
  10732 #define vgetq_lane_s8(__p0, __p1) __extension__ ({ \
  10733   int8_t __ret; \
  10734   int8x16_t __s0 = __p0; \
  10735   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  10736   __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__rev0, __p1); \
  10737   __ret; \
  10738 })
        /* __noswap_vgetq_lane_s8: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10739 #define __noswap_vgetq_lane_s8(__p0, __p1) __extension__ ({ \
  10740   int8_t __ret; \
  10741   int8x16_t __s0 = __p0; \
  10742   __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \
  10743   __ret; \
  10744 })
  10745 #endif
  10746 
  10747 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_f32(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a float32x4_t temporary, which is handed with __p1 to
         * __builtin_neon_vgetq_lane_f32; the result is yielded as float32_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10748 #define vgetq_lane_f32(__p0, __p1) __extension__ ({ \
  10749   float32_t __ret; \
  10750   float32x4_t __s0 = __p0; \
  10751   __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__s0, __p1); \
  10752   __ret; \
  10753 })
  10754 #else
        /* Big-endian build: the four lanes of the temporary are reversed with
         * __builtin_shufflevector (3, 2, 1, 0) before the builtin is called. */
  10755 #define vgetq_lane_f32(__p0, __p1) __extension__ ({ \
  10756   float32_t __ret; \
  10757   float32x4_t __s0 = __p0; \
  10758   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10759   __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__rev0, __p1); \
  10760   __ret; \
  10761 })
        /* __noswap_vgetq_lane_f32: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10762 #define __noswap_vgetq_lane_f32(__p0, __p1) __extension__ ({ \
  10763   float32_t __ret; \
  10764   float32x4_t __s0 = __p0; \
  10765   __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__s0, __p1); \
  10766   __ret; \
  10767 })
  10768 #endif
  10769 
  10770 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_s32(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int32x4_t temporary, which is handed with __p1 to
         * __builtin_neon_vgetq_lane_i32; the result is yielded as int32_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10771 #define vgetq_lane_s32(__p0, __p1) __extension__ ({ \
  10772   int32_t __ret; \
  10773   int32x4_t __s0 = __p0; \
  10774   __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \
  10775   __ret; \
  10776 })
  10777 #else
        /* Big-endian build: the four lanes of the temporary are reversed with
         * __builtin_shufflevector (3, 2, 1, 0) before the builtin is called. */
  10778 #define vgetq_lane_s32(__p0, __p1) __extension__ ({ \
  10779   int32_t __ret; \
  10780   int32x4_t __s0 = __p0; \
  10781   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10782   __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__rev0, __p1); \
  10783   __ret; \
  10784 })
        /* __noswap_vgetq_lane_s32: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10785 #define __noswap_vgetq_lane_s32(__p0, __p1) __extension__ ({ \
  10786   int32_t __ret; \
  10787   int32x4_t __s0 = __p0; \
  10788   __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \
  10789   __ret; \
  10790 })
  10791 #endif
  10792 
  10793 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_s64(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int64x2_t temporary, which is handed with __p1 to
         * __builtin_neon_vgetq_lane_i64; the result is yielded as int64_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10794 #define vgetq_lane_s64(__p0, __p1) __extension__ ({ \
  10795   int64_t __ret; \
  10796   int64x2_t __s0 = __p0; \
  10797   __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \
  10798   __ret; \
  10799 })
  10800 #else
        /* Big-endian build: the two lanes of the temporary are swapped with
         * __builtin_shufflevector (1, 0) before the builtin is called. */
  10801 #define vgetq_lane_s64(__p0, __p1) __extension__ ({ \
  10802   int64_t __ret; \
  10803   int64x2_t __s0 = __p0; \
  10804   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10805   __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__rev0, __p1); \
  10806   __ret; \
  10807 })
        /* __noswap_vgetq_lane_s64: defined only in this branch; same body as the
         * little-endian macro (no lane swap). NOTE(review): presumably meant for callers
         * whose vector is already lane-reversed - confirm at the call sites. */
  10808 #define __noswap_vgetq_lane_s64(__p0, __p1) __extension__ ({ \
  10809   int64_t __ret; \
  10810   int64x2_t __s0 = __p0; \
  10811   __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \
  10812   __ret; \
  10813 })
  10814 #endif
  10815 
  10816 #ifdef __LITTLE_ENDIAN__
        /* vgetq_lane_s16(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int16x8_t temporary, which is handed with __p1 to
         * __builtin_neon_vgetq_lane_i16; the result is yielded as int16_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10817 #define vgetq_lane_s16(__p0, __p1) __extension__ ({ \
  10818   int16_t __ret; \
  10819   int16x8_t __s0 = __p0; \
  10820   __ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \
  10821   __ret; \
  10822 })
  10823 #else
        /* Big-endian build: the eight lanes of the temporary are reversed with
         * __builtin_shufflevector (7 .. 0) before the builtin is called. */
  10824 #define vgetq_lane_s16(__p0, __p1) __extension__ ({ \
  10825   int16_t __ret; \
  10826   int16x8_t __s0 = __p0; \
  10827   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10828   __ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__rev0, __p1); \
  10829   __ret; \
  10830 })
        /* __noswap_vgetq_lane_s16: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10831 #define __noswap_vgetq_lane_s16(__p0, __p1) __extension__ ({ \
  10832   int16_t __ret; \
  10833   int16x8_t __s0 = __p0; \
  10834   __ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \
  10835   __ret; \
  10836 })
  10837 #endif
  10838 
  10839 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_u8(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a uint8x8_t temporary, which is cast to int8x8_t and handed with __p1 to
         * __builtin_neon_vget_lane_i8; the result is yielded as uint8_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10840 #define vget_lane_u8(__p0, __p1) __extension__ ({ \
  10841   uint8_t __ret; \
  10842   uint8x8_t __s0 = __p0; \
  10843   __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \
  10844   __ret; \
  10845 })
  10846 #else
        /* Big-endian build: the eight lanes of the temporary are reversed with
         * __builtin_shufflevector (7 .. 0) before the builtin is called. */
  10847 #define vget_lane_u8(__p0, __p1) __extension__ ({ \
  10848   uint8_t __ret; \
  10849   uint8x8_t __s0 = __p0; \
  10850   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10851   __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__rev0, __p1); \
  10852   __ret; \
  10853 })
        /* __noswap_vget_lane_u8: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10854 #define __noswap_vget_lane_u8(__p0, __p1) __extension__ ({ \
  10855   uint8_t __ret; \
  10856   uint8x8_t __s0 = __p0; \
  10857   __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \
  10858   __ret; \
  10859 })
  10860 #endif
  10861 
  10862 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_u32(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a uint32x2_t temporary, which is cast to int32x2_t and handed with __p1 to
         * __builtin_neon_vget_lane_i32; the result is yielded as uint32_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10863 #define vget_lane_u32(__p0, __p1) __extension__ ({ \
  10864   uint32_t __ret; \
  10865   uint32x2_t __s0 = __p0; \
  10866   __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \
  10867   __ret; \
  10868 })
  10869 #else
        /* Big-endian build: the two lanes of the temporary are swapped with
         * __builtin_shufflevector (1, 0) before the builtin is called. */
  10870 #define vget_lane_u32(__p0, __p1) __extension__ ({ \
  10871   uint32_t __ret; \
  10872   uint32x2_t __s0 = __p0; \
  10873   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10874   __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__rev0, __p1); \
  10875   __ret; \
  10876 })
        /* __noswap_vget_lane_u32: defined only in this branch; same body as the
         * little-endian macro (no lane swap). NOTE(review): presumably meant for callers
         * whose vector is already lane-reversed - confirm at the call sites. */
  10877 #define __noswap_vget_lane_u32(__p0, __p1) __extension__ ({ \
  10878   uint32_t __ret; \
  10879   uint32x2_t __s0 = __p0; \
  10880   __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \
  10881   __ret; \
  10882 })
  10883 #endif
  10884 
  /* vget_lane_u64(__p0, __p1): statement-expression macro. __p0 is expanded once into
   * a uint64x1_t temporary, which is cast to int64x1_t and handed with __p1 to
   * __builtin_neon_vget_lane_i64; the result is yielded as uint64_t. Unlike its
   * multi-lane neighbours it has a single definition with no endianness conditional
   * and no lane shuffle. */
  10885 #define vget_lane_u64(__p0, __p1) __extension__ ({ \
  10886   uint64_t __ret; \
  10887   uint64x1_t __s0 = __p0; \
  10888   __ret = (uint64_t) __builtin_neon_vget_lane_i64((int64x1_t)__s0, __p1); \
  10889   __ret; \
  10890 })
  10891 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_u16(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a uint16x4_t temporary, which is cast to int16x4_t and handed with __p1 to
         * __builtin_neon_vget_lane_i16; the result is yielded as uint16_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10892 #define vget_lane_u16(__p0, __p1) __extension__ ({ \
  10893   uint16_t __ret; \
  10894   uint16x4_t __s0 = __p0; \
  10895   __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \
  10896   __ret; \
  10897 })
  10898 #else
        /* Big-endian build: the four lanes of the temporary are reversed with
         * __builtin_shufflevector (3, 2, 1, 0) before the builtin is called. */
  10899 #define vget_lane_u16(__p0, __p1) __extension__ ({ \
  10900   uint16_t __ret; \
  10901   uint16x4_t __s0 = __p0; \
  10902   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  10903   __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__rev0, __p1); \
  10904   __ret; \
  10905 })
        /* __noswap_vget_lane_u16: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10906 #define __noswap_vget_lane_u16(__p0, __p1) __extension__ ({ \
  10907   uint16_t __ret; \
  10908   uint16x4_t __s0 = __p0; \
  10909   __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \
  10910   __ret; \
  10911 })
  10912 #endif
  10913 
  10914 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_s8(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int8x8_t temporary, which is handed with __p1 to
         * __builtin_neon_vget_lane_i8; the result is yielded as int8_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10915 #define vget_lane_s8(__p0, __p1) __extension__ ({ \
  10916   int8_t __ret; \
  10917   int8x8_t __s0 = __p0; \
  10918   __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \
  10919   __ret; \
  10920 })
  10921 #else
        /* Big-endian build: the eight lanes of the temporary are reversed with
         * __builtin_shufflevector (7 .. 0) before the builtin is called. */
  10922 #define vget_lane_s8(__p0, __p1) __extension__ ({ \
  10923   int8_t __ret; \
  10924   int8x8_t __s0 = __p0; \
  10925   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  10926   __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__rev0, __p1); \
  10927   __ret; \
  10928 })
        /* __noswap_vget_lane_s8: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  10929 #define __noswap_vget_lane_s8(__p0, __p1) __extension__ ({ \
  10930   int8_t __ret; \
  10931   int8x8_t __s0 = __p0; \
  10932   __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \
  10933   __ret; \
  10934 })
  10935 #endif
  10936 
  10937 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_f32(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into a float32x2_t temporary, which is handed with __p1 to
         * __builtin_neon_vget_lane_f32; the result is yielded as float32_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10938 #define vget_lane_f32(__p0, __p1) __extension__ ({ \
  10939   float32_t __ret; \
  10940   float32x2_t __s0 = __p0; \
  10941   __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__s0, __p1); \
  10942   __ret; \
  10943 })
  10944 #else
        /* Big-endian build: the two lanes of the temporary are swapped with
         * __builtin_shufflevector (1, 0) before the builtin is called. */
  10945 #define vget_lane_f32(__p0, __p1) __extension__ ({ \
  10946   float32_t __ret; \
  10947   float32x2_t __s0 = __p0; \
  10948   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10949   __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__rev0, __p1); \
  10950   __ret; \
  10951 })
        /* __noswap_vget_lane_f32: defined only in this branch; same body as the
         * little-endian macro (no lane swap). NOTE(review): presumably meant for callers
         * whose vector is already lane-reversed - confirm at the call sites. */
  10952 #define __noswap_vget_lane_f32(__p0, __p1) __extension__ ({ \
  10953   float32_t __ret; \
  10954   float32x2_t __s0 = __p0; \
  10955   __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__s0, __p1); \
  10956   __ret; \
  10957 })
  10958 #endif
  10959 
  10960 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_s32(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int32x2_t temporary, which is handed with __p1 to
         * __builtin_neon_vget_lane_i32; the result is yielded as int32_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10961 #define vget_lane_s32(__p0, __p1) __extension__ ({ \
  10962   int32_t __ret; \
  10963   int32x2_t __s0 = __p0; \
  10964   __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \
  10965   __ret; \
  10966 })
  10967 #else
        /* Big-endian build: the two lanes of the temporary are swapped with
         * __builtin_shufflevector (1, 0) before the builtin is called. */
  10968 #define vget_lane_s32(__p0, __p1) __extension__ ({ \
  10969   int32_t __ret; \
  10970   int32x2_t __s0 = __p0; \
  10971   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  10972   __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__rev0, __p1); \
  10973   __ret; \
  10974 })
        /* __noswap_vget_lane_s32: defined only in this branch; same body as the
         * little-endian macro (no lane swap). NOTE(review): presumably meant for callers
         * whose vector is already lane-reversed - confirm at the call sites. */
  10975 #define __noswap_vget_lane_s32(__p0, __p1) __extension__ ({ \
  10976   int32_t __ret; \
  10977   int32x2_t __s0 = __p0; \
  10978   __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \
  10979   __ret; \
  10980 })
  10981 #endif
  10982 
  /* vget_lane_s64(__p0, __p1): statement-expression macro. __p0 is expanded once into
   * an int64x1_t temporary, which is handed with __p1 to
   * __builtin_neon_vget_lane_i64; the result is yielded as int64_t. It has a single
   * definition with no endianness conditional and no lane shuffle. */
  10983 #define vget_lane_s64(__p0, __p1) __extension__ ({ \
  10984   int64_t __ret; \
  10985   int64x1_t __s0 = __p0; \
  10986   __ret = (int64_t) __builtin_neon_vget_lane_i64((int64x1_t)__s0, __p1); \
  10987   __ret; \
  10988 })
  10989 #ifdef __LITTLE_ENDIAN__
        /* vget_lane_s16(__p0, __p1): statement-expression macro. __p0 is expanded once
         * into an int16x4_t temporary, which is handed with __p1 to
         * __builtin_neon_vget_lane_i16; the result is yielded as int16_t.
         * NOTE(review): __p1 is presumably a constant lane index - confirm against ACLE. */
  10990 #define vget_lane_s16(__p0, __p1) __extension__ ({ \
  10991   int16_t __ret; \
  10992   int16x4_t __s0 = __p0; \
  10993   __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \
  10994   __ret; \
  10995 })
  10996 #else
        /* Big-endian build: the four lanes of the temporary are reversed with
         * __builtin_shufflevector (3, 2, 1, 0) before the builtin is called. */
  10997 #define vget_lane_s16(__p0, __p1) __extension__ ({ \
  10998   int16_t __ret; \
  10999   int16x4_t __s0 = __p0; \
  11000   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  11001   __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__rev0, __p1); \
  11002   __ret; \
  11003 })
        /* __noswap_vget_lane_s16: defined only in this branch; same body as the
         * little-endian macro (no lane reversal). NOTE(review): presumably meant for
         * callers whose vector is already lane-reversed - confirm at the call sites. */
  11004 #define __noswap_vget_lane_s16(__p0, __p1) __extension__ ({ \
  11005   int16_t __ret; \
  11006   int16x4_t __s0 = __p0; \
  11007   __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \
  11008   __ret; \
  11009 })
  11010 #endif
  11011 
  11012 #ifdef __LITTLE_ENDIAN__
        /* vget_low_p8: returns a poly8x8_t made of elements 0..7 of __p0, selected with
         * __builtin_shufflevector. */
  11013 __ai __attribute__((target("neon"))) poly8x8_t vget_low_p8(poly8x16_t __p0) {
  11014   poly8x8_t __ret;
  11015   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7);
  11016   return __ret;
  11017 }
  11018 #else
        /* Big-endian build: reverses all 16 elements of __p0, takes elements 0..7 of
         * that reversed copy, then reverses those 8 elements again before returning. */
  11019 __ai __attribute__((target("neon"))) poly8x8_t vget_low_p8(poly8x16_t __p0) {
  11020   poly8x8_t __ret;
  11021   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11022   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7);
  11023   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11024   return __ret;
  11025 }
  11026 #endif
  11027 
  11028 #ifdef __LITTLE_ENDIAN__
        /* vget_low_p16: returns a poly16x4_t made of elements 0..3 of __p0, selected
         * with __builtin_shufflevector. */
  11029 __ai __attribute__((target("neon"))) poly16x4_t vget_low_p16(poly16x8_t __p0) {
  11030   poly16x4_t __ret;
  11031   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
  11032   return __ret;
  11033 }
  11034 #else
        /* Big-endian build: reverses all 8 elements of __p0, takes elements 0..3 of
         * that reversed copy, then reverses those 4 elements again before returning. */
  11035 __ai __attribute__((target("neon"))) poly16x4_t vget_low_p16(poly16x8_t __p0) {
  11036   poly16x4_t __ret;
  11037   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11038   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3);
  11039   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11040   return __ret;
  11041 }
  11042 #endif
  11043 
  11044 #ifdef __LITTLE_ENDIAN__
        /* vget_low_u8: returns a uint8x8_t made of elements 0..7 of __p0, selected with
         * __builtin_shufflevector. */
  11045 __ai __attribute__((target("neon"))) uint8x8_t vget_low_u8(uint8x16_t __p0) {
  11046   uint8x8_t __ret;
  11047   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7);
  11048   return __ret;
  11049 }
  11050 #else
        /* Big-endian build: reverses all 16 elements of __p0, takes elements 0..7 of
         * that reversed copy, then reverses those 8 elements again before returning. */
  11051 __ai __attribute__((target("neon"))) uint8x8_t vget_low_u8(uint8x16_t __p0) {
  11052   uint8x8_t __ret;
  11053   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11054   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7);
  11055   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11056   return __ret;
  11057 }
  11058 #endif
  11059 
  11060 #ifdef __LITTLE_ENDIAN__
        /* vget_low_u32: returns a uint32x2_t made of elements 0 and 1 of __p0, selected
         * with __builtin_shufflevector. */
  11061 __ai __attribute__((target("neon"))) uint32x2_t vget_low_u32(uint32x4_t __p0) {
  11062   uint32x2_t __ret;
  11063   __ret = __builtin_shufflevector(__p0, __p0, 0, 1);
  11064   return __ret;
  11065 }
  11066 #else
        /* Big-endian build: reverses all 4 elements of __p0, takes elements 0 and 1 of
         * that reversed copy, then swaps those 2 elements before returning. */
  11067 __ai __attribute__((target("neon"))) uint32x2_t vget_low_u32(uint32x4_t __p0) {
  11068   uint32x2_t __ret;
  11069   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11070   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1);
  11071   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11072   return __ret;
  11073 }
  11074 #endif
  11075 
  11076 #ifdef __LITTLE_ENDIAN__
        /* vget_low_u64: returns a uint64x1_t holding element 0 of __p0, selected with
         * __builtin_shufflevector. */
  11077 __ai __attribute__((target("neon"))) uint64x1_t vget_low_u64(uint64x2_t __p0) {
  11078   uint64x1_t __ret;
  11079   __ret = __builtin_shufflevector(__p0, __p0, 0);
  11080   return __ret;
  11081 }
  11082 #else
        /* Big-endian build: swaps the 2 elements of __p0 and returns element 0 of that
         * swapped copy; the one-element result gets no further shuffle. */
  11083 __ai __attribute__((target("neon"))) uint64x1_t vget_low_u64(uint64x2_t __p0) {
  11084   uint64x1_t __ret;
  11085   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11086   __ret = __builtin_shufflevector(__rev0, __rev0, 0);
  11087   return __ret;
  11088 }
  11089 #endif
  11090 
  11091 #ifdef __LITTLE_ENDIAN__
        /* vget_low_u16: returns a uint16x4_t made of elements 0..3 of __p0, selected
         * with __builtin_shufflevector. */
  11092 __ai __attribute__((target("neon"))) uint16x4_t vget_low_u16(uint16x8_t __p0) {
  11093   uint16x4_t __ret;
  11094   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
  11095   return __ret;
  11096 }
  11097 #else
        /* Big-endian build: reverses all 8 elements of __p0, takes elements 0..3 of
         * that reversed copy, then reverses those 4 elements again before returning. */
  11098 __ai __attribute__((target("neon"))) uint16x4_t vget_low_u16(uint16x8_t __p0) {
  11099   uint16x4_t __ret;
  11100   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11101   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3);
  11102   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11103   return __ret;
  11104 }
  11105 #endif
  11106 
  11107 #ifdef __LITTLE_ENDIAN__
        /* vget_low_s8: returns an int8x8_t made of elements 0..7 of __p0, selected with
         * __builtin_shufflevector. */
  11108 __ai __attribute__((target("neon"))) int8x8_t vget_low_s8(int8x16_t __p0) {
  11109   int8x8_t __ret;
  11110   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7);
  11111   return __ret;
  11112 }
  11113 #else
        /* Big-endian build: reverses all 16 elements of __p0, takes elements 0..7 of
         * that reversed copy, then reverses those 8 elements again before returning. */
  11114 __ai __attribute__((target("neon"))) int8x8_t vget_low_s8(int8x16_t __p0) {
  11115   int8x8_t __ret;
  11116   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11117   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7);
  11118   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11119   return __ret;
  11120 }
  11121 #endif
  11122 
  11123 #ifdef __LITTLE_ENDIAN__
        /* vget_low_f32: returns a float32x2_t made of elements 0 and 1 of __p0,
         * selected with __builtin_shufflevector. */
  11124 __ai __attribute__((target("neon"))) float32x2_t vget_low_f32(float32x4_t __p0) {
  11125   float32x2_t __ret;
  11126   __ret = __builtin_shufflevector(__p0, __p0, 0, 1);
  11127   return __ret;
  11128 }
  11129 #else
        /* Big-endian build: reverses all 4 elements of __p0, takes elements 0 and 1 of
         * that reversed copy, then swaps those 2 elements before returning. */
  11130 __ai __attribute__((target("neon"))) float32x2_t vget_low_f32(float32x4_t __p0) {
  11131   float32x2_t __ret;
  11132   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11133   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1);
  11134   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11135   return __ret;
  11136 }
  11137 #endif
  11138 
  11139 #ifdef __LITTLE_ENDIAN__
        /* vget_low_f16: returns a float16x4_t made of elements 0..3 of __p0, selected
         * with __builtin_shufflevector. */
  11140 __ai __attribute__((target("neon"))) float16x4_t vget_low_f16(float16x8_t __p0) {
  11141   float16x4_t __ret;
  11142   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
  11143   return __ret;
  11144 }
  11145 #else
        /* Big-endian build: reverses all 8 elements of __p0, takes elements 0..3 of
         * that reversed copy, then reverses those 4 elements again before returning. */
  11146 __ai __attribute__((target("neon"))) float16x4_t vget_low_f16(float16x8_t __p0) {
  11147   float16x4_t __ret;
  11148   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11149   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3);
  11150   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11151   return __ret;
  11152 }
  11153 #endif
  11154 
  11155 #ifdef __LITTLE_ENDIAN__
        /* vget_low_s32: returns an int32x2_t made of elements 0 and 1 of __p0, selected
         * with __builtin_shufflevector. */
  11156 __ai __attribute__((target("neon"))) int32x2_t vget_low_s32(int32x4_t __p0) {
  11157   int32x2_t __ret;
  11158   __ret = __builtin_shufflevector(__p0, __p0, 0, 1);
  11159   return __ret;
  11160 }
  11161 #else
        /* Big-endian build: reverses all 4 elements of __p0, takes elements 0 and 1 of
         * that reversed copy, then swaps those 2 elements before returning. */
  11162 __ai __attribute__((target("neon"))) int32x2_t vget_low_s32(int32x4_t __p0) {
  11163   int32x2_t __ret;
  11164   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11165   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1);
  11166   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11167   return __ret;
  11168 }
  11169 #endif
  11170 
  11171 #ifdef __LITTLE_ENDIAN__
        /* vget_low_s64: returns an int64x1_t holding element 0 of __p0, selected with
         * __builtin_shufflevector. */
  11172 __ai __attribute__((target("neon"))) int64x1_t vget_low_s64(int64x2_t __p0) {
  11173   int64x1_t __ret;
  11174   __ret = __builtin_shufflevector(__p0, __p0, 0);
  11175   return __ret;
  11176 }
  11177 #else
        /* Big-endian build: swaps the 2 elements of __p0 and returns element 0 of that
         * swapped copy; the one-element result gets no further shuffle. */
  11178 __ai __attribute__((target("neon"))) int64x1_t vget_low_s64(int64x2_t __p0) {
  11179   int64x1_t __ret;
  11180   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11181   __ret = __builtin_shufflevector(__rev0, __rev0, 0);
  11182   return __ret;
  11183 }
  11184 #endif
  11185 
  11186 #ifdef __LITTLE_ENDIAN__
        /* vget_low_s16: returns an int16x4_t made of elements 0..3 of __p0, selected
         * with __builtin_shufflevector. */
  11187 __ai __attribute__((target("neon"))) int16x4_t vget_low_s16(int16x8_t __p0) {
  11188   int16x4_t __ret;
  11189   __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3);
  11190   return __ret;
  11191 }
  11192 #else
        /* Big-endian build: reverses all 8 elements of __p0, takes elements 0..3 of
         * that reversed copy, then reverses those 4 elements again before returning. */
  11193 __ai __attribute__((target("neon"))) int16x4_t vget_low_s16(int16x8_t __p0) {
  11194   int16x4_t __ret;
  11195   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11196   __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3);
  11197   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11198   return __ret;
  11199 }
  11200 #endif
  11201 
  11202 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_u8: casts both operands to int8x16_t, passes them to
         * __builtin_neon_vhaddq_v with the constant 48, and casts the result to
         * uint8x16_t. NOTE(review): 48 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11203 __ai __attribute__((target("neon"))) uint8x16_t vhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  11204   uint8x16_t __ret;
  11205   __ret = (uint8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  11206   return __ret;
  11207 }
  11208 #else
        /* Big-endian build: both operands have their 16 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11209 __ai __attribute__((target("neon"))) uint8x16_t vhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  11210   uint8x16_t __ret;
  11211   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11212   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11213   __ret = (uint8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  11214   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11215   return __ret;
  11216 }
  11217 #endif
  11218 
  11219 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_u32: casts both operands to int8x16_t, passes them to
         * __builtin_neon_vhaddq_v with the constant 50, and casts the result to
         * uint32x4_t. NOTE(review): 50 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11220 __ai __attribute__((target("neon"))) uint32x4_t vhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  11221   uint32x4_t __ret;
  11222   __ret = (uint32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  11223   return __ret;
  11224 }
  11225 #else
        /* Big-endian build: both operands have their 4 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11226 __ai __attribute__((target("neon"))) uint32x4_t vhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  11227   uint32x4_t __ret;
  11228   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11229   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11230   __ret = (uint32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  11231   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11232   return __ret;
  11233 }
  11234 #endif
  11235 
  11236 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_u16: casts both operands to int8x16_t, passes them to
         * __builtin_neon_vhaddq_v with the constant 49, and casts the result to
         * uint16x8_t. NOTE(review): 49 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11237 __ai __attribute__((target("neon"))) uint16x8_t vhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  11238   uint16x8_t __ret;
  11239   __ret = (uint16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  11240   return __ret;
  11241 }
  11242 #else
        /* Big-endian build: both operands have their 8 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11243 __ai __attribute__((target("neon"))) uint16x8_t vhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  11244   uint16x8_t __ret;
  11245   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11246   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11247   __ret = (uint16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  11248   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11249   return __ret;
  11250 }
  11251 #endif
  11252 
  11253 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_s8: passes both int8x16_t operands to __builtin_neon_vhaddq_v with the
         * constant 32 and returns the result as int8x16_t. NOTE(review): 32 is
         * presumably the builtin's element-type selector for this overload - confirm
         * against clang's NEON type flags. */
  11254 __ai __attribute__((target("neon"))) int8x16_t vhaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  11255   int8x16_t __ret;
  11256   __ret = (int8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  11257   return __ret;
  11258 }
  11259 #else
        /* Big-endian build: both operands have their 16 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11260 __ai __attribute__((target("neon"))) int8x16_t vhaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  11261   int8x16_t __ret;
  11262   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11263   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11264   __ret = (int8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  11265   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11266   return __ret;
  11267 }
  11268 #endif
  11269 
  11270 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_s32: casts both operands to int8x16_t, passes them to
         * __builtin_neon_vhaddq_v with the constant 34, and casts the result to
         * int32x4_t. NOTE(review): 34 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11271 __ai __attribute__((target("neon"))) int32x4_t vhaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  11272   int32x4_t __ret;
  11273   __ret = (int32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  11274   return __ret;
  11275 }
  11276 #else
        /* Big-endian build: both operands have their 4 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11277 __ai __attribute__((target("neon"))) int32x4_t vhaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  11278   int32x4_t __ret;
  11279   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11280   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11281   __ret = (int32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  11282   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11283   return __ret;
  11284 }
  11285 #endif
  11286 
  11287 #ifdef __LITTLE_ENDIAN__
        /* vhaddq_s16: casts both operands to int8x16_t, passes them to
         * __builtin_neon_vhaddq_v with the constant 33, and casts the result to
         * int16x8_t. NOTE(review): 33 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11288 __ai __attribute__((target("neon"))) int16x8_t vhaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  11289   int16x8_t __ret;
  11290   __ret = (int16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  11291   return __ret;
  11292 }
  11293 #else
        /* Big-endian build: both operands have their 8 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11294 __ai __attribute__((target("neon"))) int16x8_t vhaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  11295   int16x8_t __ret;
  11296   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11297   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11298   __ret = (int16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  11299   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11300   return __ret;
  11301 }
  11302 #endif
  11303 
  11304 #ifdef __LITTLE_ENDIAN__
        /* vhadd_u8: casts both operands to int8x8_t, passes them to
         * __builtin_neon_vhadd_v with the constant 16, and casts the result to
         * uint8x8_t. NOTE(review): 16 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11305 __ai __attribute__((target("neon"))) uint8x8_t vhadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  11306   uint8x8_t __ret;
  11307   __ret = (uint8x8_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  11308   return __ret;
  11309 }
  11310 #else
        /* Big-endian build: both operands have their 8 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11311 __ai __attribute__((target("neon"))) uint8x8_t vhadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  11312   uint8x8_t __ret;
  11313   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11314   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11315   __ret = (uint8x8_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  11316   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11317   return __ret;
  11318 }
  11319 #endif
  11320 
  11321 #ifdef __LITTLE_ENDIAN__
        /* vhadd_u32: casts both operands to int8x8_t, passes them to
         * __builtin_neon_vhadd_v with the constant 18, and casts the result to
         * uint32x2_t. NOTE(review): 18 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11322 __ai __attribute__((target("neon"))) uint32x2_t vhadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  11323   uint32x2_t __ret;
  11324   __ret = (uint32x2_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  11325   return __ret;
  11326 }
  11327 #else
        /* Big-endian build: both operands have their 2 lanes swapped before the
         * builtin call, and the result's lanes are swapped again before it is returned. */
  11328 __ai __attribute__((target("neon"))) uint32x2_t vhadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  11329   uint32x2_t __ret;
  11330   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11331   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  11332   __ret = (uint32x2_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  11333   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11334   return __ret;
  11335 }
  11336 #endif
  11337 
  11338 #ifdef __LITTLE_ENDIAN__
        /* vhadd_u16: casts both operands to int8x8_t, passes them to
         * __builtin_neon_vhadd_v with the constant 17, and casts the result to
         * uint16x4_t. NOTE(review): 17 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11339 __ai __attribute__((target("neon"))) uint16x4_t vhadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  11340   uint16x4_t __ret;
  11341   __ret = (uint16x4_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  11342   return __ret;
  11343 }
  11344 #else
        /* Big-endian build: both operands have their 4 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11345 __ai __attribute__((target("neon"))) uint16x4_t vhadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  11346   uint16x4_t __ret;
  11347   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11348   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11349   __ret = (uint16x4_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  11350   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11351   return __ret;
  11352 }
  11353 #endif
  11354 
  11355 #ifdef __LITTLE_ENDIAN__
        /* vhadd_s8: passes both int8x8_t operands to __builtin_neon_vhadd_v with the
         * constant 0 and returns the result as int8x8_t. NOTE(review): 0 is presumably
         * the builtin's element-type selector for this overload - confirm against
         * clang's NEON type flags. */
  11356 __ai __attribute__((target("neon"))) int8x8_t vhadd_s8(int8x8_t __p0, int8x8_t __p1) {
  11357   int8x8_t __ret;
  11358   __ret = (int8x8_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  11359   return __ret;
  11360 }
  11361 #else
        /* Big-endian build: both operands have their 8 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11362 __ai __attribute__((target("neon"))) int8x8_t vhadd_s8(int8x8_t __p0, int8x8_t __p1) {
  11363   int8x8_t __ret;
  11364   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11365   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11366   __ret = (int8x8_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  11367   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11368   return __ret;
  11369 }
  11370 #endif
  11371 
  11372 #ifdef __LITTLE_ENDIAN__
        /* vhadd_s32: casts both operands to int8x8_t, passes them to
         * __builtin_neon_vhadd_v with the constant 2, and casts the result to
         * int32x2_t. NOTE(review): 2 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11373 __ai __attribute__((target("neon"))) int32x2_t vhadd_s32(int32x2_t __p0, int32x2_t __p1) {
  11374   int32x2_t __ret;
  11375   __ret = (int32x2_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  11376   return __ret;
  11377 }
  11378 #else
        /* Big-endian build: both operands have their 2 lanes swapped before the
         * builtin call, and the result's lanes are swapped again before it is returned. */
  11379 __ai __attribute__((target("neon"))) int32x2_t vhadd_s32(int32x2_t __p0, int32x2_t __p1) {
  11380   int32x2_t __ret;
  11381   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11382   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  11383   __ret = (int32x2_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  11384   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11385   return __ret;
  11386 }
  11387 #endif
  11388 
  11389 #ifdef __LITTLE_ENDIAN__
        /* vhadd_s16: casts both operands to int8x8_t, passes them to
         * __builtin_neon_vhadd_v with the constant 1, and casts the result to
         * int16x4_t. NOTE(review): 1 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11390 __ai __attribute__((target("neon"))) int16x4_t vhadd_s16(int16x4_t __p0, int16x4_t __p1) {
  11391   int16x4_t __ret;
  11392   __ret = (int16x4_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  11393   return __ret;
  11394 }
  11395 #else
        /* Big-endian build: both operands have their 4 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11396 __ai __attribute__((target("neon"))) int16x4_t vhadd_s16(int16x4_t __p0, int16x4_t __p1) {
  11397   int16x4_t __ret;
  11398   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11399   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11400   __ret = (int16x4_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  11401   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11402   return __ret;
  11403 }
  11404 #endif
  11405 
  11406 #ifdef __LITTLE_ENDIAN__
        /* vhsubq_u8: casts both operands to int8x16_t, passes them (in __p0, __p1
         * order) to __builtin_neon_vhsubq_v with the constant 48, and casts the result
         * to uint8x16_t. NOTE(review): 48 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11407 __ai __attribute__((target("neon"))) uint8x16_t vhsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  11408   uint8x16_t __ret;
  11409   __ret = (uint8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  11410   return __ret;
  11411 }
  11412 #else
        /* Big-endian build: both operands have their 16 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11413 __ai __attribute__((target("neon"))) uint8x16_t vhsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  11414   uint8x16_t __ret;
  11415   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11416   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11417   __ret = (uint8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  11418   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11419   return __ret;
  11420 }
  11421 #endif
  11422 
  11423 #ifdef __LITTLE_ENDIAN__
        /* vhsubq_u32: casts both operands to int8x16_t, passes them (in __p0, __p1
         * order) to __builtin_neon_vhsubq_v with the constant 50, and casts the result
         * to uint32x4_t. NOTE(review): 50 is presumably the builtin's element-type
         * selector for this overload - confirm against clang's NEON type flags. */
  11424 __ai __attribute__((target("neon"))) uint32x4_t vhsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  11425   uint32x4_t __ret;
  11426   __ret = (uint32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  11427   return __ret;
  11428 }
  11429 #else
        /* Big-endian build: both operands have their 4 lanes reversed before the
         * builtin call, and the result is lane-reversed again before it is returned. */
  11430 __ai __attribute__((target("neon"))) uint32x4_t vhsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  11431   uint32x4_t __ret;
  11432   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11433   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11434   __ret = (uint32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  11435   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11436   return __ret;
  11437 }
  11438 #endif
  11439 
  11440 #ifdef __LITTLE_ENDIAN__
  11441 __ai __attribute__((target("neon"))) uint16x8_t vhsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  11442   uint16x8_t __ret;
  11443   __ret = (uint16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  11444   return __ret;
  11445 }
  11446 #else
  11447 __ai __attribute__((target("neon"))) uint16x8_t vhsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  11448   uint16x8_t __ret;
  11449   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11450   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11451   __ret = (uint16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  11452   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11453   return __ret;
  11454 }
  11455 #endif
  11456 
  11457 #ifdef __LITTLE_ENDIAN__
  11458 __ai __attribute__((target("neon"))) int8x16_t vhsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  11459   int8x16_t __ret;
  11460   __ret = (int8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  11461   return __ret;
  11462 }
  11463 #else
  11464 __ai __attribute__((target("neon"))) int8x16_t vhsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  11465   int8x16_t __ret;
  11466   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11467   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11468   __ret = (int8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  11469   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  11470   return __ret;
  11471 }
  11472 #endif
  11473 
  11474 #ifdef __LITTLE_ENDIAN__
  11475 __ai __attribute__((target("neon"))) int32x4_t vhsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  11476   int32x4_t __ret;
  11477   __ret = (int32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  11478   return __ret;
  11479 }
  11480 #else
  11481 __ai __attribute__((target("neon"))) int32x4_t vhsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  11482   int32x4_t __ret;
  11483   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11484   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11485   __ret = (int32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  11486   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11487   return __ret;
  11488 }
  11489 #endif
  11490 
  11491 #ifdef __LITTLE_ENDIAN__
  11492 __ai __attribute__((target("neon"))) int16x8_t vhsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  11493   int16x8_t __ret;
  11494   __ret = (int16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  11495   return __ret;
  11496 }
  11497 #else
  11498 __ai __attribute__((target("neon"))) int16x8_t vhsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  11499   int16x8_t __ret;
  11500   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11501   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11502   __ret = (int16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  11503   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11504   return __ret;
  11505 }
  11506 #endif
  11507 
  11508 #ifdef __LITTLE_ENDIAN__
  11509 __ai __attribute__((target("neon"))) uint8x8_t vhsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  11510   uint8x8_t __ret;
  11511   __ret = (uint8x8_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  11512   return __ret;
  11513 }
  11514 #else
  11515 __ai __attribute__((target("neon"))) uint8x8_t vhsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  11516   uint8x8_t __ret;
  11517   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11518   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11519   __ret = (uint8x8_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  11520   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11521   return __ret;
  11522 }
  11523 #endif
  11524 
  11525 #ifdef __LITTLE_ENDIAN__
  11526 __ai __attribute__((target("neon"))) uint32x2_t vhsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  11527   uint32x2_t __ret;
  11528   __ret = (uint32x2_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  11529   return __ret;
  11530 }
  11531 #else
  11532 __ai __attribute__((target("neon"))) uint32x2_t vhsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  11533   uint32x2_t __ret;
  11534   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11535   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  11536   __ret = (uint32x2_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  11537   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11538   return __ret;
  11539 }
  11540 #endif
  11541 
  11542 #ifdef __LITTLE_ENDIAN__
  11543 __ai __attribute__((target("neon"))) uint16x4_t vhsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  11544   uint16x4_t __ret;
  11545   __ret = (uint16x4_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  11546   return __ret;
  11547 }
  11548 #else
  11549 __ai __attribute__((target("neon"))) uint16x4_t vhsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  11550   uint16x4_t __ret;
  11551   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11552   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11553   __ret = (uint16x4_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  11554   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11555   return __ret;
  11556 }
  11557 #endif
  11558 
  11559 #ifdef __LITTLE_ENDIAN__
  11560 __ai __attribute__((target("neon"))) int8x8_t vhsub_s8(int8x8_t __p0, int8x8_t __p1) {
  11561   int8x8_t __ret;
  11562   __ret = (int8x8_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  11563   return __ret;
  11564 }
  11565 #else
  11566 __ai __attribute__((target("neon"))) int8x8_t vhsub_s8(int8x8_t __p0, int8x8_t __p1) {
  11567   int8x8_t __ret;
  11568   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  11569   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  11570   __ret = (int8x8_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  11571   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  11572   return __ret;
  11573 }
  11574 #endif
  11575 
  11576 #ifdef __LITTLE_ENDIAN__
  11577 __ai __attribute__((target("neon"))) int32x2_t vhsub_s32(int32x2_t __p0, int32x2_t __p1) {
  11578   int32x2_t __ret;
  11579   __ret = (int32x2_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  11580   return __ret;
  11581 }
  11582 #else
  11583 __ai __attribute__((target("neon"))) int32x2_t vhsub_s32(int32x2_t __p0, int32x2_t __p1) {
  11584   int32x2_t __ret;
  11585   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  11586   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  11587   __ret = (int32x2_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  11588   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  11589   return __ret;
  11590 }
  11591 #endif
  11592 
  11593 #ifdef __LITTLE_ENDIAN__
  11594 __ai __attribute__((target("neon"))) int16x4_t vhsub_s16(int16x4_t __p0, int16x4_t __p1) {
  11595   int16x4_t __ret;
  11596   __ret = (int16x4_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  11597   return __ret;
  11598 }
  11599 #else
  11600 __ai __attribute__((target("neon"))) int16x4_t vhsub_s16(int16x4_t __p0, int16x4_t __p1) {
  11601   int16x4_t __ret;
  11602   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  11603   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  11604   __ret = (int16x4_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  11605   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  11606   return __ret;
  11607 }
  11608 #endif
  11609 
  11610 #ifdef __LITTLE_ENDIAN__
  11611 #define vld1_p8(__p0) __extension__ ({ \
  11612   poly8x8_t __ret; \
  11613   __ret = (poly8x8_t) __builtin_neon_vld1_v(__p0, 4); \
  11614   __ret; \
  11615 })
  11616 #else
  11617 #define vld1_p8(__p0) __extension__ ({ \
  11618   poly8x8_t __ret; \
  11619   __ret = (poly8x8_t) __builtin_neon_vld1_v(__p0, 4); \
  11620   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11621   __ret; \
  11622 })
  11623 #endif
  11624 
  11625 #ifdef __LITTLE_ENDIAN__
  11626 #define vld1_p16(__p0) __extension__ ({ \
  11627   poly16x4_t __ret; \
  11628   __ret = (poly16x4_t) __builtin_neon_vld1_v(__p0, 5); \
  11629   __ret; \
  11630 })
  11631 #else
  11632 #define vld1_p16(__p0) __extension__ ({ \
  11633   poly16x4_t __ret; \
  11634   __ret = (poly16x4_t) __builtin_neon_vld1_v(__p0, 5); \
  11635   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11636   __ret; \
  11637 })
  11638 #endif
  11639 
  11640 #ifdef __LITTLE_ENDIAN__
  11641 #define vld1q_p8(__p0) __extension__ ({ \
  11642   poly8x16_t __ret; \
  11643   __ret = (poly8x16_t) __builtin_neon_vld1q_v(__p0, 36); \
  11644   __ret; \
  11645 })
  11646 #else
  11647 #define vld1q_p8(__p0) __extension__ ({ \
  11648   poly8x16_t __ret; \
  11649   __ret = (poly8x16_t) __builtin_neon_vld1q_v(__p0, 36); \
  11650   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  11651   __ret; \
  11652 })
  11653 #endif
  11654 
  11655 #ifdef __LITTLE_ENDIAN__
  11656 #define vld1q_p16(__p0) __extension__ ({ \
  11657   poly16x8_t __ret; \
  11658   __ret = (poly16x8_t) __builtin_neon_vld1q_v(__p0, 37); \
  11659   __ret; \
  11660 })
  11661 #else
  11662 #define vld1q_p16(__p0) __extension__ ({ \
  11663   poly16x8_t __ret; \
  11664   __ret = (poly16x8_t) __builtin_neon_vld1q_v(__p0, 37); \
  11665   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11666   __ret; \
  11667 })
  11668 #endif
  11669 
  11670 #ifdef __LITTLE_ENDIAN__
  11671 #define vld1q_u8(__p0) __extension__ ({ \
  11672   uint8x16_t __ret; \
  11673   __ret = (uint8x16_t) __builtin_neon_vld1q_v(__p0, 48); \
  11674   __ret; \
  11675 })
  11676 #else
  11677 #define vld1q_u8(__p0) __extension__ ({ \
  11678   uint8x16_t __ret; \
  11679   __ret = (uint8x16_t) __builtin_neon_vld1q_v(__p0, 48); \
  11680   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  11681   __ret; \
  11682 })
  11683 #endif
  11684 
  11685 #ifdef __LITTLE_ENDIAN__
  11686 #define vld1q_u32(__p0) __extension__ ({ \
  11687   uint32x4_t __ret; \
  11688   __ret = (uint32x4_t) __builtin_neon_vld1q_v(__p0, 50); \
  11689   __ret; \
  11690 })
  11691 #else
  11692 #define vld1q_u32(__p0) __extension__ ({ \
  11693   uint32x4_t __ret; \
  11694   __ret = (uint32x4_t) __builtin_neon_vld1q_v(__p0, 50); \
  11695   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11696   __ret; \
  11697 })
  11698 #endif
  11699 
  11700 #ifdef __LITTLE_ENDIAN__
  11701 #define vld1q_u64(__p0) __extension__ ({ \
  11702   uint64x2_t __ret; \
  11703   __ret = (uint64x2_t) __builtin_neon_vld1q_v(__p0, 51); \
  11704   __ret; \
  11705 })
  11706 #else
  11707 #define vld1q_u64(__p0) __extension__ ({ \
  11708   uint64x2_t __ret; \
  11709   __ret = (uint64x2_t) __builtin_neon_vld1q_v(__p0, 51); \
  11710   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  11711   __ret; \
  11712 })
  11713 #endif
  11714 
  11715 #ifdef __LITTLE_ENDIAN__
  11716 #define vld1q_u16(__p0) __extension__ ({ \
  11717   uint16x8_t __ret; \
  11718   __ret = (uint16x8_t) __builtin_neon_vld1q_v(__p0, 49); \
  11719   __ret; \
  11720 })
  11721 #else
  11722 #define vld1q_u16(__p0) __extension__ ({ \
  11723   uint16x8_t __ret; \
  11724   __ret = (uint16x8_t) __builtin_neon_vld1q_v(__p0, 49); \
  11725   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11726   __ret; \
  11727 })
  11728 #endif
  11729 
  11730 #ifdef __LITTLE_ENDIAN__
  11731 #define vld1q_s8(__p0) __extension__ ({ \
  11732   int8x16_t __ret; \
  11733   __ret = (int8x16_t) __builtin_neon_vld1q_v(__p0, 32); \
  11734   __ret; \
  11735 })
  11736 #else
  11737 #define vld1q_s8(__p0) __extension__ ({ \
  11738   int8x16_t __ret; \
  11739   __ret = (int8x16_t) __builtin_neon_vld1q_v(__p0, 32); \
  11740   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  11741   __ret; \
  11742 })
  11743 #endif
  11744 
  11745 #ifdef __LITTLE_ENDIAN__
  11746 #define vld1q_f32(__p0) __extension__ ({ \
  11747   float32x4_t __ret; \
  11748   __ret = (float32x4_t) __builtin_neon_vld1q_v(__p0, 41); \
  11749   __ret; \
  11750 })
  11751 #else
  11752 #define vld1q_f32(__p0) __extension__ ({ \
  11753   float32x4_t __ret; \
  11754   __ret = (float32x4_t) __builtin_neon_vld1q_v(__p0, 41); \
  11755   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11756   __ret; \
  11757 })
  11758 #endif
  11759 
  11760 #ifdef __LITTLE_ENDIAN__
  11761 #define vld1q_s32(__p0) __extension__ ({ \
  11762   int32x4_t __ret; \
  11763   __ret = (int32x4_t) __builtin_neon_vld1q_v(__p0, 34); \
  11764   __ret; \
  11765 })
  11766 #else
  11767 #define vld1q_s32(__p0) __extension__ ({ \
  11768   int32x4_t __ret; \
  11769   __ret = (int32x4_t) __builtin_neon_vld1q_v(__p0, 34); \
  11770   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11771   __ret; \
  11772 })
  11773 #endif
  11774 
  11775 #ifdef __LITTLE_ENDIAN__
  11776 #define vld1q_s64(__p0) __extension__ ({ \
  11777   int64x2_t __ret; \
  11778   __ret = (int64x2_t) __builtin_neon_vld1q_v(__p0, 35); \
  11779   __ret; \
  11780 })
  11781 #else
  11782 #define vld1q_s64(__p0) __extension__ ({ \
  11783   int64x2_t __ret; \
  11784   __ret = (int64x2_t) __builtin_neon_vld1q_v(__p0, 35); \
  11785   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  11786   __ret; \
  11787 })
  11788 #endif
  11789 
  11790 #ifdef __LITTLE_ENDIAN__
  11791 #define vld1q_s16(__p0) __extension__ ({ \
  11792   int16x8_t __ret; \
  11793   __ret = (int16x8_t) __builtin_neon_vld1q_v(__p0, 33); \
  11794   __ret; \
  11795 })
  11796 #else
  11797 #define vld1q_s16(__p0) __extension__ ({ \
  11798   int16x8_t __ret; \
  11799   __ret = (int16x8_t) __builtin_neon_vld1q_v(__p0, 33); \
  11800   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11801   __ret; \
  11802 })
  11803 #endif
  11804 
  11805 #ifdef __LITTLE_ENDIAN__
  11806 #define vld1_u8(__p0) __extension__ ({ \
  11807   uint8x8_t __ret; \
  11808   __ret = (uint8x8_t) __builtin_neon_vld1_v(__p0, 16); \
  11809   __ret; \
  11810 })
  11811 #else
  11812 #define vld1_u8(__p0) __extension__ ({ \
  11813   uint8x8_t __ret; \
  11814   __ret = (uint8x8_t) __builtin_neon_vld1_v(__p0, 16); \
  11815   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11816   __ret; \
  11817 })
  11818 #endif
  11819 
  11820 #ifdef __LITTLE_ENDIAN__
  11821 #define vld1_u32(__p0) __extension__ ({ \
  11822   uint32x2_t __ret; \
  11823   __ret = (uint32x2_t) __builtin_neon_vld1_v(__p0, 18); \
  11824   __ret; \
  11825 })
  11826 #else
  11827 #define vld1_u32(__p0) __extension__ ({ \
  11828   uint32x2_t __ret; \
  11829   __ret = (uint32x2_t) __builtin_neon_vld1_v(__p0, 18); \
  11830   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  11831   __ret; \
  11832 })
  11833 #endif
  11834 
  11835 #define vld1_u64(__p0) __extension__ ({ \
  11836   uint64x1_t __ret; \
  11837   __ret = (uint64x1_t) __builtin_neon_vld1_v(__p0, 19); \
  11838   __ret; \
  11839 })
  11840 #ifdef __LITTLE_ENDIAN__
  11841 #define vld1_u16(__p0) __extension__ ({ \
  11842   uint16x4_t __ret; \
  11843   __ret = (uint16x4_t) __builtin_neon_vld1_v(__p0, 17); \
  11844   __ret; \
  11845 })
  11846 #else
  11847 #define vld1_u16(__p0) __extension__ ({ \
  11848   uint16x4_t __ret; \
  11849   __ret = (uint16x4_t) __builtin_neon_vld1_v(__p0, 17); \
  11850   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11851   __ret; \
  11852 })
  11853 #endif
  11854 
  11855 #ifdef __LITTLE_ENDIAN__
  11856 #define vld1_s8(__p0) __extension__ ({ \
  11857   int8x8_t __ret; \
  11858   __ret = (int8x8_t) __builtin_neon_vld1_v(__p0, 0); \
  11859   __ret; \
  11860 })
  11861 #else
  11862 #define vld1_s8(__p0) __extension__ ({ \
  11863   int8x8_t __ret; \
  11864   __ret = (int8x8_t) __builtin_neon_vld1_v(__p0, 0); \
  11865   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11866   __ret; \
  11867 })
  11868 #endif
  11869 
  11870 #ifdef __LITTLE_ENDIAN__
  11871 #define vld1_f32(__p0) __extension__ ({ \
  11872   float32x2_t __ret; \
  11873   __ret = (float32x2_t) __builtin_neon_vld1_v(__p0, 9); \
  11874   __ret; \
  11875 })
  11876 #else
  11877 #define vld1_f32(__p0) __extension__ ({ \
  11878   float32x2_t __ret; \
  11879   __ret = (float32x2_t) __builtin_neon_vld1_v(__p0, 9); \
  11880   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  11881   __ret; \
  11882 })
  11883 #endif
  11884 
  11885 #ifdef __LITTLE_ENDIAN__
  11886 #define vld1_s32(__p0) __extension__ ({ \
  11887   int32x2_t __ret; \
  11888   __ret = (int32x2_t) __builtin_neon_vld1_v(__p0, 2); \
  11889   __ret; \
  11890 })
  11891 #else
  11892 #define vld1_s32(__p0) __extension__ ({ \
  11893   int32x2_t __ret; \
  11894   __ret = (int32x2_t) __builtin_neon_vld1_v(__p0, 2); \
  11895   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  11896   __ret; \
  11897 })
  11898 #endif
  11899 
  11900 #define vld1_s64(__p0) __extension__ ({ \
  11901   int64x1_t __ret; \
  11902   __ret = (int64x1_t) __builtin_neon_vld1_v(__p0, 3); \
  11903   __ret; \
  11904 })
  11905 #ifdef __LITTLE_ENDIAN__
  11906 #define vld1_s16(__p0) __extension__ ({ \
  11907   int16x4_t __ret; \
  11908   __ret = (int16x4_t) __builtin_neon_vld1_v(__p0, 1); \
  11909   __ret; \
  11910 })
  11911 #else
  11912 #define vld1_s16(__p0) __extension__ ({ \
  11913   int16x4_t __ret; \
  11914   __ret = (int16x4_t) __builtin_neon_vld1_v(__p0, 1); \
  11915   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11916   __ret; \
  11917 })
  11918 #endif
  11919 
  11920 #ifdef __LITTLE_ENDIAN__
  11921 #define vld1_dup_p8(__p0) __extension__ ({ \
  11922   poly8x8_t __ret; \
  11923   __ret = (poly8x8_t) __builtin_neon_vld1_dup_v(__p0, 4); \
  11924   __ret; \
  11925 })
  11926 #else
  11927 #define vld1_dup_p8(__p0) __extension__ ({ \
  11928   poly8x8_t __ret; \
  11929   __ret = (poly8x8_t) __builtin_neon_vld1_dup_v(__p0, 4); \
  11930   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11931   __ret; \
  11932 })
  11933 #endif
  11934 
  11935 #ifdef __LITTLE_ENDIAN__
  11936 #define vld1_dup_p16(__p0) __extension__ ({ \
  11937   poly16x4_t __ret; \
  11938   __ret = (poly16x4_t) __builtin_neon_vld1_dup_v(__p0, 5); \
  11939   __ret; \
  11940 })
  11941 #else
  11942 #define vld1_dup_p16(__p0) __extension__ ({ \
  11943   poly16x4_t __ret; \
  11944   __ret = (poly16x4_t) __builtin_neon_vld1_dup_v(__p0, 5); \
  11945   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  11946   __ret; \
  11947 })
  11948 #endif
  11949 
  11950 #ifdef __LITTLE_ENDIAN__
  11951 #define vld1q_dup_p8(__p0) __extension__ ({ \
  11952   poly8x16_t __ret; \
  11953   __ret = (poly8x16_t) __builtin_neon_vld1q_dup_v(__p0, 36); \
  11954   __ret; \
  11955 })
  11956 #else
  11957 #define vld1q_dup_p8(__p0) __extension__ ({ \
  11958   poly8x16_t __ret; \
  11959   __ret = (poly8x16_t) __builtin_neon_vld1q_dup_v(__p0, 36); \
  11960   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  11961   __ret; \
  11962 })
  11963 #endif
  11964 
  11965 #ifdef __LITTLE_ENDIAN__
  11966 #define vld1q_dup_p16(__p0) __extension__ ({ \
  11967   poly16x8_t __ret; \
  11968   __ret = (poly16x8_t) __builtin_neon_vld1q_dup_v(__p0, 37); \
  11969   __ret; \
  11970 })
  11971 #else
  11972 #define vld1q_dup_p16(__p0) __extension__ ({ \
  11973   poly16x8_t __ret; \
  11974   __ret = (poly16x8_t) __builtin_neon_vld1q_dup_v(__p0, 37); \
  11975   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  11976   __ret; \
  11977 })
  11978 #endif
  11979 
  11980 #ifdef __LITTLE_ENDIAN__
  11981 #define vld1q_dup_u8(__p0) __extension__ ({ \
  11982   uint8x16_t __ret; \
  11983   __ret = (uint8x16_t) __builtin_neon_vld1q_dup_v(__p0, 48); \
  11984   __ret; \
  11985 })
  11986 #else
  11987 #define vld1q_dup_u8(__p0) __extension__ ({ \
  11988   uint8x16_t __ret; \
  11989   __ret = (uint8x16_t) __builtin_neon_vld1q_dup_v(__p0, 48); \
  11990   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  11991   __ret; \
  11992 })
  11993 #endif
  11994 
  11995 #ifdef __LITTLE_ENDIAN__
  11996 #define vld1q_dup_u32(__p0) __extension__ ({ \
  11997   uint32x4_t __ret; \
  11998   __ret = (uint32x4_t) __builtin_neon_vld1q_dup_v(__p0, 50); \
  11999   __ret; \
  12000 })
  12001 #else
  12002 #define vld1q_dup_u32(__p0) __extension__ ({ \
  12003   uint32x4_t __ret; \
  12004   __ret = (uint32x4_t) __builtin_neon_vld1q_dup_v(__p0, 50); \
  12005   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12006   __ret; \
  12007 })
  12008 #endif
  12009 
  12010 #ifdef __LITTLE_ENDIAN__
  12011 #define vld1q_dup_u64(__p0) __extension__ ({ \
  12012   uint64x2_t __ret; \
  12013   __ret = (uint64x2_t) __builtin_neon_vld1q_dup_v(__p0, 51); \
  12014   __ret; \
  12015 })
  12016 #else
  12017 #define vld1q_dup_u64(__p0) __extension__ ({ \
  12018   uint64x2_t __ret; \
  12019   __ret = (uint64x2_t) __builtin_neon_vld1q_dup_v(__p0, 51); \
  12020   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12021   __ret; \
  12022 })
  12023 #endif
  12024 
  12025 #ifdef __LITTLE_ENDIAN__
  12026 #define vld1q_dup_u16(__p0) __extension__ ({ \
  12027   uint16x8_t __ret; \
  12028   __ret = (uint16x8_t) __builtin_neon_vld1q_dup_v(__p0, 49); \
  12029   __ret; \
  12030 })
  12031 #else
  12032 #define vld1q_dup_u16(__p0) __extension__ ({ \
  12033   uint16x8_t __ret; \
  12034   __ret = (uint16x8_t) __builtin_neon_vld1q_dup_v(__p0, 49); \
  12035   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12036   __ret; \
  12037 })
  12038 #endif
  12039 
  12040 #ifdef __LITTLE_ENDIAN__
  12041 #define vld1q_dup_s8(__p0) __extension__ ({ \
  12042   int8x16_t __ret; \
  12043   __ret = (int8x16_t) __builtin_neon_vld1q_dup_v(__p0, 32); \
  12044   __ret; \
  12045 })
  12046 #else
  12047 #define vld1q_dup_s8(__p0) __extension__ ({ \
  12048   int8x16_t __ret; \
  12049   __ret = (int8x16_t) __builtin_neon_vld1q_dup_v(__p0, 32); \
  12050   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12051   __ret; \
  12052 })
  12053 #endif
  12054 
  12055 #ifdef __LITTLE_ENDIAN__
  12056 #define vld1q_dup_f32(__p0) __extension__ ({ \
  12057   float32x4_t __ret; \
  12058   __ret = (float32x4_t) __builtin_neon_vld1q_dup_v(__p0, 41); \
  12059   __ret; \
  12060 })
  12061 #else
  12062 #define vld1q_dup_f32(__p0) __extension__ ({ \
  12063   float32x4_t __ret; \
  12064   __ret = (float32x4_t) __builtin_neon_vld1q_dup_v(__p0, 41); \
  12065   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12066   __ret; \
  12067 })
  12068 #endif
  12069 
  12070 #ifdef __LITTLE_ENDIAN__
  12071 #define vld1q_dup_s32(__p0) __extension__ ({ \
  12072   int32x4_t __ret; \
  12073   __ret = (int32x4_t) __builtin_neon_vld1q_dup_v(__p0, 34); \
  12074   __ret; \
  12075 })
  12076 #else
  12077 #define vld1q_dup_s32(__p0) __extension__ ({ \
  12078   int32x4_t __ret; \
  12079   __ret = (int32x4_t) __builtin_neon_vld1q_dup_v(__p0, 34); \
  12080   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12081   __ret; \
  12082 })
  12083 #endif
  12084 
  12085 #ifdef __LITTLE_ENDIAN__
  12086 #define vld1q_dup_s64(__p0) __extension__ ({ \
  12087   int64x2_t __ret; \
  12088   __ret = (int64x2_t) __builtin_neon_vld1q_dup_v(__p0, 35); \
  12089   __ret; \
  12090 })
  12091 #else
  12092 #define vld1q_dup_s64(__p0) __extension__ ({ \
  12093   int64x2_t __ret; \
  12094   __ret = (int64x2_t) __builtin_neon_vld1q_dup_v(__p0, 35); \
  12095   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12096   __ret; \
  12097 })
  12098 #endif
  12099 
  12100 #ifdef __LITTLE_ENDIAN__
  12101 #define vld1q_dup_s16(__p0) __extension__ ({ \
  12102   int16x8_t __ret; \
  12103   __ret = (int16x8_t) __builtin_neon_vld1q_dup_v(__p0, 33); \
  12104   __ret; \
  12105 })
  12106 #else
  12107 #define vld1q_dup_s16(__p0) __extension__ ({ \
  12108   int16x8_t __ret; \
  12109   __ret = (int16x8_t) __builtin_neon_vld1q_dup_v(__p0, 33); \
  12110   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12111   __ret; \
  12112 })
  12113 #endif
  12114 
  12115 #ifdef __LITTLE_ENDIAN__
  12116 #define vld1_dup_u8(__p0) __extension__ ({ \
  12117   uint8x8_t __ret; \
  12118   __ret = (uint8x8_t) __builtin_neon_vld1_dup_v(__p0, 16); \
  12119   __ret; \
  12120 })
  12121 #else
  12122 #define vld1_dup_u8(__p0) __extension__ ({ \
  12123   uint8x8_t __ret; \
  12124   __ret = (uint8x8_t) __builtin_neon_vld1_dup_v(__p0, 16); \
  12125   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12126   __ret; \
  12127 })
  12128 #endif
  12129 
  12130 #ifdef __LITTLE_ENDIAN__
  12131 #define vld1_dup_u32(__p0) __extension__ ({ \
  12132   uint32x2_t __ret; \
  12133   __ret = (uint32x2_t) __builtin_neon_vld1_dup_v(__p0, 18); \
  12134   __ret; \
  12135 })
  12136 #else
  12137 #define vld1_dup_u32(__p0) __extension__ ({ \
  12138   uint32x2_t __ret; \
  12139   __ret = (uint32x2_t) __builtin_neon_vld1_dup_v(__p0, 18); \
  12140   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12141   __ret; \
  12142 })
  12143 #endif
  12144 
  12145 #define vld1_dup_u64(__p0) __extension__ ({ \
  12146   uint64x1_t __ret; \
  12147   __ret = (uint64x1_t) __builtin_neon_vld1_dup_v(__p0, 19); \
  12148   __ret; \
  12149 })
  12150 #ifdef __LITTLE_ENDIAN__
  12151 #define vld1_dup_u16(__p0) __extension__ ({ \
  12152   uint16x4_t __ret; \
  12153   __ret = (uint16x4_t) __builtin_neon_vld1_dup_v(__p0, 17); \
  12154   __ret; \
  12155 })
  12156 #else
  12157 #define vld1_dup_u16(__p0) __extension__ ({ \
  12158   uint16x4_t __ret; \
  12159   __ret = (uint16x4_t) __builtin_neon_vld1_dup_v(__p0, 17); \
  12160   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12161   __ret; \
  12162 })
  12163 #endif
  12164 
  12165 #ifdef __LITTLE_ENDIAN__
  12166 #define vld1_dup_s8(__p0) __extension__ ({ \
  12167   int8x8_t __ret; \
  12168   __ret = (int8x8_t) __builtin_neon_vld1_dup_v(__p0, 0); \
  12169   __ret; \
  12170 })
  12171 #else
  12172 #define vld1_dup_s8(__p0) __extension__ ({ \
  12173   int8x8_t __ret; \
  12174   __ret = (int8x8_t) __builtin_neon_vld1_dup_v(__p0, 0); \
  12175   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12176   __ret; \
  12177 })
  12178 #endif
  12179 
  12180 #ifdef __LITTLE_ENDIAN__
  12181 #define vld1_dup_f32(__p0) __extension__ ({ \
  12182   float32x2_t __ret; \
  12183   __ret = (float32x2_t) __builtin_neon_vld1_dup_v(__p0, 9); \
  12184   __ret; \
  12185 })
  12186 #else
  12187 #define vld1_dup_f32(__p0) __extension__ ({ \
  12188   float32x2_t __ret; \
  12189   __ret = (float32x2_t) __builtin_neon_vld1_dup_v(__p0, 9); \
  12190   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12191   __ret; \
  12192 })
  12193 #endif
  12194 
  12195 #ifdef __LITTLE_ENDIAN__
  12196 #define vld1_dup_s32(__p0) __extension__ ({ \
  12197   int32x2_t __ret; \
  12198   __ret = (int32x2_t) __builtin_neon_vld1_dup_v(__p0, 2); \
  12199   __ret; \
  12200 })
  12201 #else
  12202 #define vld1_dup_s32(__p0) __extension__ ({ \
  12203   int32x2_t __ret; \
  12204   __ret = (int32x2_t) __builtin_neon_vld1_dup_v(__p0, 2); \
  12205   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12206   __ret; \
  12207 })
  12208 #endif
  12209 
  12210 #define vld1_dup_s64(__p0) __extension__ ({ \
  12211   int64x1_t __ret; \
  12212   __ret = (int64x1_t) __builtin_neon_vld1_dup_v(__p0, 3); \
  12213   __ret; \
  12214 })
  12215 #ifdef __LITTLE_ENDIAN__
  12216 #define vld1_dup_s16(__p0) __extension__ ({ \
  12217   int16x4_t __ret; \
  12218   __ret = (int16x4_t) __builtin_neon_vld1_dup_v(__p0, 1); \
  12219   __ret; \
  12220 })
  12221 #else
  12222 #define vld1_dup_s16(__p0) __extension__ ({ \
  12223   int16x4_t __ret; \
  12224   __ret = (int16x4_t) __builtin_neon_vld1_dup_v(__p0, 1); \
  12225   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12226   __ret; \
  12227 })
  12228 #endif
  12229 
  12230 #ifdef __LITTLE_ENDIAN__
  12231 #define vld1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  12232   poly8x8_t __ret; \
  12233   poly8x8_t __s1 = __p1; \
  12234   __ret = (poly8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 4); \
  12235   __ret; \
  12236 })
  12237 #else
  12238 #define vld1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  12239   poly8x8_t __ret; \
  12240   poly8x8_t __s1 = __p1; \
  12241   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12242   __ret = (poly8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 4); \
  12243   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12244   __ret; \
  12245 })
  12246 #endif
  12247 
  12248 #ifdef __LITTLE_ENDIAN__
  12249 #define vld1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  12250   poly16x4_t __ret; \
  12251   poly16x4_t __s1 = __p1; \
  12252   __ret = (poly16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 5); \
  12253   __ret; \
  12254 })
  12255 #else
  12256 #define vld1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  12257   poly16x4_t __ret; \
  12258   poly16x4_t __s1 = __p1; \
  12259   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12260   __ret = (poly16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 5); \
  12261   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12262   __ret; \
  12263 })
  12264 #endif
  12265 
  /* vld1q_lane_p8(__p0, __p1, __p2): statement expression yielding a poly8x16_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 36 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12266 #ifdef __LITTLE_ENDIAN__
  12267 #define vld1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  12268   poly8x16_t __ret; \
  12269   poly8x16_t __s1 = __p1; \
  12270   __ret = (poly8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 36); \
  12271   __ret; \
  12272 })
  12273 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (15 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12274 #define vld1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  12275   poly8x16_t __ret; \
  12276   poly8x16_t __s1 = __p1; \
  12277   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12278   __ret = (poly8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 36); \
  12279   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12280   __ret; \
  12281 })
  12282 #endif
  12283 
  /* vld1q_lane_p16(__p0, __p1, __p2): statement expression yielding a poly16x8_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 37 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12284 #ifdef __LITTLE_ENDIAN__
  12285 #define vld1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  12286   poly16x8_t __ret; \
  12287   poly16x8_t __s1 = __p1; \
  12288   __ret = (poly16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 37); \
  12289   __ret; \
  12290 })
  12291 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (7 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12292 #define vld1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  12293   poly16x8_t __ret; \
  12294   poly16x8_t __s1 = __p1; \
  12295   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12296   __ret = (poly16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 37); \
  12297   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12298   __ret; \
  12299 })
  12300 #endif
  12301 
  /* vld1q_lane_u8(__p0, __p1, __p2): statement expression yielding a uint8x16_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 48 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12302 #ifdef __LITTLE_ENDIAN__
  12303 #define vld1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  12304   uint8x16_t __ret; \
  12305   uint8x16_t __s1 = __p1; \
  12306   __ret = (uint8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 48); \
  12307   __ret; \
  12308 })
  12309 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (15 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12310 #define vld1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  12311   uint8x16_t __ret; \
  12312   uint8x16_t __s1 = __p1; \
  12313   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12314   __ret = (uint8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 48); \
  12315   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12316   __ret; \
  12317 })
  12318 #endif
  12319 
  /* vld1q_lane_u32(__p0, __p1, __p2): statement expression yielding a uint32x4_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 50 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12320 #ifdef __LITTLE_ENDIAN__
  12321 #define vld1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  12322   uint32x4_t __ret; \
  12323   uint32x4_t __s1 = __p1; \
  12324   __ret = (uint32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 50); \
  12325   __ret; \
  12326 })
  12327 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (3, 2, 1, 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12328 #define vld1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  12329   uint32x4_t __ret; \
  12330   uint32x4_t __s1 = __p1; \
  12331   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12332   __ret = (uint32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 50); \
  12333   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12334   __ret; \
  12335 })
  12336 #endif
  12337 
  /* vld1q_lane_u64(__p0, __p1, __p2): statement expression yielding a uint64x2_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 51 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12338 #ifdef __LITTLE_ENDIAN__
  12339 #define vld1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  12340   uint64x2_t __ret; \
  12341   uint64x2_t __s1 = __p1; \
  12342   __ret = (uint64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 51); \
  12343   __ret; \
  12344 })
  12345 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (1, 0) before the
   * builtin call and the result is lane-reversed again before being yielded. */
  12346 #define vld1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  12347   uint64x2_t __ret; \
  12348   uint64x2_t __s1 = __p1; \
  12349   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  12350   __ret = (uint64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 51); \
  12351   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12352   __ret; \
  12353 })
  12354 #endif
  12355 
  /* vld1q_lane_u16(__p0, __p1, __p2): statement expression yielding a uint16x8_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 49 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12356 #ifdef __LITTLE_ENDIAN__
  12357 #define vld1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  12358   uint16x8_t __ret; \
  12359   uint16x8_t __s1 = __p1; \
  12360   __ret = (uint16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 49); \
  12361   __ret; \
  12362 })
  12363 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (7 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12364 #define vld1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  12365   uint16x8_t __ret; \
  12366   uint16x8_t __s1 = __p1; \
  12367   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12368   __ret = (uint16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 49); \
  12369   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12370   __ret; \
  12371 })
  12372 #endif
  12373 
  /* vld1q_lane_s8(__p0, __p1, __p2): statement expression yielding an int8x16_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 32 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12374 #ifdef __LITTLE_ENDIAN__
  12375 #define vld1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  12376   int8x16_t __ret; \
  12377   int8x16_t __s1 = __p1; \
  12378   __ret = (int8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 32); \
  12379   __ret; \
  12380 })
  12381 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (15 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12382 #define vld1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  12383   int8x16_t __ret; \
  12384   int8x16_t __s1 = __p1; \
  12385   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12386   __ret = (int8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 32); \
  12387   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12388   __ret; \
  12389 })
  12390 #endif
  12391 
  /* vld1q_lane_f32(__p0, __p1, __p2): statement expression yielding a float32x4_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 41 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12392 #ifdef __LITTLE_ENDIAN__
  12393 #define vld1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  12394   float32x4_t __ret; \
  12395   float32x4_t __s1 = __p1; \
  12396   __ret = (float32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 41); \
  12397   __ret; \
  12398 })
  12399 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (3, 2, 1, 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12400 #define vld1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  12401   float32x4_t __ret; \
  12402   float32x4_t __s1 = __p1; \
  12403   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12404   __ret = (float32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 41); \
  12405   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12406   __ret; \
  12407 })
  12408 #endif
  12409 
  /* vld1q_lane_s32(__p0, __p1, __p2): statement expression yielding an int32x4_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 34 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12410 #ifdef __LITTLE_ENDIAN__
  12411 #define vld1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  12412   int32x4_t __ret; \
  12413   int32x4_t __s1 = __p1; \
  12414   __ret = (int32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 34); \
  12415   __ret; \
  12416 })
  12417 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (3, 2, 1, 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12418 #define vld1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  12419   int32x4_t __ret; \
  12420   int32x4_t __s1 = __p1; \
  12421   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12422   __ret = (int32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 34); \
  12423   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12424   __ret; \
  12425 })
  12426 #endif
  12427 
  /* vld1q_lane_s64(__p0, __p1, __p2): statement expression yielding an int64x2_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 35 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12428 #ifdef __LITTLE_ENDIAN__
  12429 #define vld1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  12430   int64x2_t __ret; \
  12431   int64x2_t __s1 = __p1; \
  12432   __ret = (int64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 35); \
  12433   __ret; \
  12434 })
  12435 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (1, 0) before the
   * builtin call and the result is lane-reversed again before being yielded. */
  12436 #define vld1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  12437   int64x2_t __ret; \
  12438   int64x2_t __s1 = __p1; \
  12439   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  12440   __ret = (int64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 35); \
  12441   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12442   __ret; \
  12443 })
  12444 #endif
  12445 
  /* vld1q_lane_s16(__p0, __p1, __p2): statement expression yielding an int16x8_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x16_t), __p2 and
   * the constant 33 to __builtin_neon_vld1q_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1q_lane semantics); the builtin itself is opaque here -- confirm. */
  12446 #ifdef __LITTLE_ENDIAN__
  12447 #define vld1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  12448   int16x8_t __ret; \
  12449   int16x8_t __s1 = __p1; \
  12450   __ret = (int16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 33); \
  12451   __ret; \
  12452 })
  12453 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (7 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12454 #define vld1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  12455   int16x8_t __ret; \
  12456   int16x8_t __s1 = __p1; \
  12457   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12458   __ret = (int16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 33); \
  12459   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12460   __ret; \
  12461 })
  12462 #endif
  12463 
  /* vld1_lane_u8(__p0, __p1, __p2): statement expression yielding a uint8x8_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 16 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12464 #ifdef __LITTLE_ENDIAN__
  12465 #define vld1_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  12466   uint8x8_t __ret; \
  12467   uint8x8_t __s1 = __p1; \
  12468   __ret = (uint8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 16); \
  12469   __ret; \
  12470 })
  12471 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (7 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12472 #define vld1_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  12473   uint8x8_t __ret; \
  12474   uint8x8_t __s1 = __p1; \
  12475   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12476   __ret = (uint8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 16); \
  12477   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12478   __ret; \
  12479 })
  12480 #endif
  12481 
  /* vld1_lane_u32(__p0, __p1, __p2): statement expression yielding a uint32x2_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 18 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12482 #ifdef __LITTLE_ENDIAN__
  12483 #define vld1_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  12484   uint32x2_t __ret; \
  12485   uint32x2_t __s1 = __p1; \
  12486   __ret = (uint32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 18); \
  12487   __ret; \
  12488 })
  12489 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (1, 0) before the
   * builtin call and the result is lane-reversed again before being yielded. */
  12490 #define vld1_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  12491   uint32x2_t __ret; \
  12492   uint32x2_t __s1 = __p1; \
  12493   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  12494   __ret = (uint32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 18); \
  12495   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12496   __ret; \
  12497 })
  12498 #endif
  12499 
  /* vld1_lane_u64(__p0, __p1, __p2): statement expression yielding a uint64x1_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 19 to __builtin_neon_vld1_lane_v, and casts the result back.
   * Defined once here, with no __LITTLE_ENDIAN__ split and no lane reversal.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12500 #define vld1_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  12501   uint64x1_t __ret; \
  12502   uint64x1_t __s1 = __p1; \
  12503   __ret = (uint64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 19); \
  12504   __ret; \
  12505 })
  /* vld1_lane_u16(__p0, __p1, __p2): statement expression yielding a uint16x4_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 17 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12506 #ifdef __LITTLE_ENDIAN__
  12507 #define vld1_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  12508   uint16x4_t __ret; \
  12509   uint16x4_t __s1 = __p1; \
  12510   __ret = (uint16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 17); \
  12511   __ret; \
  12512 })
  12513 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (3, 2, 1, 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12514 #define vld1_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  12515   uint16x4_t __ret; \
  12516   uint16x4_t __s1 = __p1; \
  12517   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12518   __ret = (uint16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 17); \
  12519   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12520   __ret; \
  12521 })
  12522 #endif
  12523 
  /* vld1_lane_s8(__p0, __p1, __p2): statement expression yielding an int8x8_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 0 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12524 #ifdef __LITTLE_ENDIAN__
  12525 #define vld1_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  12526   int8x8_t __ret; \
  12527   int8x8_t __s1 = __p1; \
  12528   __ret = (int8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 0); \
  12529   __ret; \
  12530 })
  12531 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (7 ... 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12532 #define vld1_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  12533   int8x8_t __ret; \
  12534   int8x8_t __s1 = __p1; \
  12535   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  12536   __ret = (int8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 0); \
  12537   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  12538   __ret; \
  12539 })
  12540 #endif
  12541 
  /* vld1_lane_f32(__p0, __p1, __p2): statement expression yielding a float32x2_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 9 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12542 #ifdef __LITTLE_ENDIAN__
  12543 #define vld1_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  12544   float32x2_t __ret; \
  12545   float32x2_t __s1 = __p1; \
  12546   __ret = (float32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 9); \
  12547   __ret; \
  12548 })
  12549 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (1, 0) before the
   * builtin call and the result is lane-reversed again before being yielded. */
  12550 #define vld1_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  12551   float32x2_t __ret; \
  12552   float32x2_t __s1 = __p1; \
  12553   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  12554   __ret = (float32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 9); \
  12555   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12556   __ret; \
  12557 })
  12558 #endif
  12559 
  /* vld1_lane_s32(__p0, __p1, __p2): statement expression yielding an int32x2_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 2 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12560 #ifdef __LITTLE_ENDIAN__
  12561 #define vld1_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  12562   int32x2_t __ret; \
  12563   int32x2_t __s1 = __p1; \
  12564   __ret = (int32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 2); \
  12565   __ret; \
  12566 })
  12567 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (1, 0) before the
   * builtin call and the result is lane-reversed again before being yielded. */
  12568 #define vld1_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  12569   int32x2_t __ret; \
  12570   int32x2_t __s1 = __p1; \
  12571   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  12572   __ret = (int32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 2); \
  12573   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  12574   __ret; \
  12575 })
  12576 #endif
  12577 
  /* vld1_lane_s64(__p0, __p1, __p2): statement expression yielding an int64x1_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 3 to __builtin_neon_vld1_lane_v, and casts the result back.
   * Defined once here, with no __LITTLE_ENDIAN__ split and no lane reversal.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12578 #define vld1_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  12579   int64x1_t __ret; \
  12580   int64x1_t __s1 = __p1; \
  12581   __ret = (int64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 3); \
  12582   __ret; \
  12583 })
  /* vld1_lane_s16(__p0, __p1, __p2): statement expression yielding an int16x4_t.
   * Copies __p1 into a local, passes __p0, that copy (cast to int8x8_t), __p2 and
   * the constant 1 to __builtin_neon_vld1_lane_v, and casts the result back.
   * NOTE(review): presumably __p0 is the load address and __p2 the lane index
   * (ACLE vld1_lane semantics); the builtin itself is opaque here -- confirm. */
  12584 #ifdef __LITTLE_ENDIAN__
  12585 #define vld1_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  12586   int16x4_t __ret; \
  12587   int16x4_t __s1 = __p1; \
  12588   __ret = (int16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 1); \
  12589   __ret; \
  12590 })
  12591 #else
  /* Without __LITTLE_ENDIAN__: the input copy is lane-reversed (3, 2, 1, 0) before
   * the builtin call and the result is lane-reversed again before being yielded. */
  12592 #define vld1_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  12593   int16x4_t __ret; \
  12594   int16x4_t __s1 = __p1; \
  12595   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  12596   __ret = (int16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 1); \
  12597   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  12598   __ret; \
  12599 })
  12600 #endif
  12601 
  /* vld1_p8_x2(__p0): statement expression yielding a poly8x8x2_t.
   * Passes the address of the local result, __p0 and the constant 4 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12602 #ifdef __LITTLE_ENDIAN__
  12603 #define vld1_p8_x2(__p0) __extension__ ({ \
  12604   poly8x8x2_t __ret; \
  12605   __builtin_neon_vld1_x2_v(&__ret, __p0, 4); \
  12606   __ret; \
  12607 })
  12608 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12609 #define vld1_p8_x2(__p0) __extension__ ({ \
  12610   poly8x8x2_t __ret; \
  12611   __builtin_neon_vld1_x2_v(&__ret, __p0, 4); \
  12612  \
  12613   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12614   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12615   __ret; \
  12616 })
  12617 #endif
  12618 
  /* vld1_p16_x2(__p0): statement expression yielding a poly16x4x2_t.
   * Passes the address of the local result, __p0 and the constant 5 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12619 #ifdef __LITTLE_ENDIAN__
  12620 #define vld1_p16_x2(__p0) __extension__ ({ \
  12621   poly16x4x2_t __ret; \
  12622   __builtin_neon_vld1_x2_v(&__ret, __p0, 5); \
  12623   __ret; \
  12624 })
  12625 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12626 #define vld1_p16_x2(__p0) __extension__ ({ \
  12627   poly16x4x2_t __ret; \
  12628   __builtin_neon_vld1_x2_v(&__ret, __p0, 5); \
  12629  \
  12630   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12631   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12632   __ret; \
  12633 })
  12634 #endif
  12635 
  /* vld1q_p8_x2(__p0): statement expression yielding a poly8x16x2_t.
   * Passes the address of the local result, __p0 and the constant 36 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12636 #ifdef __LITTLE_ENDIAN__
  12637 #define vld1q_p8_x2(__p0) __extension__ ({ \
  12638   poly8x16x2_t __ret; \
  12639   __builtin_neon_vld1q_x2_v(&__ret, __p0, 36); \
  12640   __ret; \
  12641 })
  12642 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (15 ... 0) after the builtin call. */
  12643 #define vld1q_p8_x2(__p0) __extension__ ({ \
  12644   poly8x16x2_t __ret; \
  12645   __builtin_neon_vld1q_x2_v(&__ret, __p0, 36); \
  12646  \
  12647   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12648   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12649   __ret; \
  12650 })
  12651 #endif
  12652 
  /* vld1q_p16_x2(__p0): statement expression yielding a poly16x8x2_t.
   * Passes the address of the local result, __p0 and the constant 37 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12653 #ifdef __LITTLE_ENDIAN__
  12654 #define vld1q_p16_x2(__p0) __extension__ ({ \
  12655   poly16x8x2_t __ret; \
  12656   __builtin_neon_vld1q_x2_v(&__ret, __p0, 37); \
  12657   __ret; \
  12658 })
  12659 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12660 #define vld1q_p16_x2(__p0) __extension__ ({ \
  12661   poly16x8x2_t __ret; \
  12662   __builtin_neon_vld1q_x2_v(&__ret, __p0, 37); \
  12663  \
  12664   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12665   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12666   __ret; \
  12667 })
  12668 #endif
  12669 
  /* vld1q_u8_x2(__p0): statement expression yielding a uint8x16x2_t.
   * Passes the address of the local result, __p0 and the constant 48 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12670 #ifdef __LITTLE_ENDIAN__
  12671 #define vld1q_u8_x2(__p0) __extension__ ({ \
  12672   uint8x16x2_t __ret; \
  12673   __builtin_neon_vld1q_x2_v(&__ret, __p0, 48); \
  12674   __ret; \
  12675 })
  12676 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (15 ... 0) after the builtin call. */
  12677 #define vld1q_u8_x2(__p0) __extension__ ({ \
  12678   uint8x16x2_t __ret; \
  12679   __builtin_neon_vld1q_x2_v(&__ret, __p0, 48); \
  12680  \
  12681   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12682   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12683   __ret; \
  12684 })
  12685 #endif
  12686 
  /* vld1q_u32_x2(__p0): statement expression yielding a uint32x4x2_t.
   * Passes the address of the local result, __p0 and the constant 50 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12687 #ifdef __LITTLE_ENDIAN__
  12688 #define vld1q_u32_x2(__p0) __extension__ ({ \
  12689   uint32x4x2_t __ret; \
  12690   __builtin_neon_vld1q_x2_v(&__ret, __p0, 50); \
  12691   __ret; \
  12692 })
  12693 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12694 #define vld1q_u32_x2(__p0) __extension__ ({ \
  12695   uint32x4x2_t __ret; \
  12696   __builtin_neon_vld1q_x2_v(&__ret, __p0, 50); \
  12697  \
  12698   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12699   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12700   __ret; \
  12701 })
  12702 #endif
  12703 
  /* vld1q_u64_x2(__p0): statement expression yielding a uint64x2x2_t.
   * Passes the address of the local result, __p0 and the constant 51 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12704 #ifdef __LITTLE_ENDIAN__
  12705 #define vld1q_u64_x2(__p0) __extension__ ({ \
  12706   uint64x2x2_t __ret; \
  12707   __builtin_neon_vld1q_x2_v(&__ret, __p0, 51); \
  12708   __ret; \
  12709 })
  12710 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  12711 #define vld1q_u64_x2(__p0) __extension__ ({ \
  12712   uint64x2x2_t __ret; \
  12713   __builtin_neon_vld1q_x2_v(&__ret, __p0, 51); \
  12714  \
  12715   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  12716   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  12717   __ret; \
  12718 })
  12719 #endif
  12720 
  /* vld1q_u16_x2(__p0): statement expression yielding a uint16x8x2_t.
   * Passes the address of the local result, __p0 and the constant 49 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12721 #ifdef __LITTLE_ENDIAN__
  12722 #define vld1q_u16_x2(__p0) __extension__ ({ \
  12723   uint16x8x2_t __ret; \
  12724   __builtin_neon_vld1q_x2_v(&__ret, __p0, 49); \
  12725   __ret; \
  12726 })
  12727 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12728 #define vld1q_u16_x2(__p0) __extension__ ({ \
  12729   uint16x8x2_t __ret; \
  12730   __builtin_neon_vld1q_x2_v(&__ret, __p0, 49); \
  12731  \
  12732   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12733   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12734   __ret; \
  12735 })
  12736 #endif
  12737 
  /* vld1q_s8_x2(__p0): statement expression yielding an int8x16x2_t.
   * Passes the address of the local result, __p0 and the constant 32 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12738 #ifdef __LITTLE_ENDIAN__
  12739 #define vld1q_s8_x2(__p0) __extension__ ({ \
  12740   int8x16x2_t __ret; \
  12741   __builtin_neon_vld1q_x2_v(&__ret, __p0, 32); \
  12742   __ret; \
  12743 })
  12744 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (15 ... 0) after the builtin call. */
  12745 #define vld1q_s8_x2(__p0) __extension__ ({ \
  12746   int8x16x2_t __ret; \
  12747   __builtin_neon_vld1q_x2_v(&__ret, __p0, 32); \
  12748  \
  12749   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12750   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  12751   __ret; \
  12752 })
  12753 #endif
  12754 
  /* vld1q_f32_x2(__p0): statement expression yielding a float32x4x2_t.
   * Passes the address of the local result, __p0 and the constant 41 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12755 #ifdef __LITTLE_ENDIAN__
  12756 #define vld1q_f32_x2(__p0) __extension__ ({ \
  12757   float32x4x2_t __ret; \
  12758   __builtin_neon_vld1q_x2_v(&__ret, __p0, 41); \
  12759   __ret; \
  12760 })
  12761 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12762 #define vld1q_f32_x2(__p0) __extension__ ({ \
  12763   float32x4x2_t __ret; \
  12764   __builtin_neon_vld1q_x2_v(&__ret, __p0, 41); \
  12765  \
  12766   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12767   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12768   __ret; \
  12769 })
  12770 #endif
  12771 
  /* vld1q_s32_x2(__p0): statement expression yielding an int32x4x2_t.
   * Passes the address of the local result, __p0 and the constant 34 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12772 #ifdef __LITTLE_ENDIAN__
  12773 #define vld1q_s32_x2(__p0) __extension__ ({ \
  12774   int32x4x2_t __ret; \
  12775   __builtin_neon_vld1q_x2_v(&__ret, __p0, 34); \
  12776   __ret; \
  12777 })
  12778 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12779 #define vld1q_s32_x2(__p0) __extension__ ({ \
  12780   int32x4x2_t __ret; \
  12781   __builtin_neon_vld1q_x2_v(&__ret, __p0, 34); \
  12782  \
  12783   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12784   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12785   __ret; \
  12786 })
  12787 #endif
  12788 
  /* vld1q_s64_x2(__p0): statement expression yielding an int64x2x2_t.
   * Passes the address of the local result, __p0 and the constant 35 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12789 #ifdef __LITTLE_ENDIAN__
  12790 #define vld1q_s64_x2(__p0) __extension__ ({ \
  12791   int64x2x2_t __ret; \
  12792   __builtin_neon_vld1q_x2_v(&__ret, __p0, 35); \
  12793   __ret; \
  12794 })
  12795 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  12796 #define vld1q_s64_x2(__p0) __extension__ ({ \
  12797   int64x2x2_t __ret; \
  12798   __builtin_neon_vld1q_x2_v(&__ret, __p0, 35); \
  12799  \
  12800   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  12801   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  12802   __ret; \
  12803 })
  12804 #endif
  12805 
  /* vld1q_s16_x2(__p0): statement expression yielding an int16x8x2_t.
   * Passes the address of the local result, __p0 and the constant 33 to
   * __builtin_neon_vld1q_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1q_x2 semantics); it is opaque here -- confirm. */
  12806 #ifdef __LITTLE_ENDIAN__
  12807 #define vld1q_s16_x2(__p0) __extension__ ({ \
  12808   int16x8x2_t __ret; \
  12809   __builtin_neon_vld1q_x2_v(&__ret, __p0, 33); \
  12810   __ret; \
  12811 })
  12812 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12813 #define vld1q_s16_x2(__p0) __extension__ ({ \
  12814   int16x8x2_t __ret; \
  12815   __builtin_neon_vld1q_x2_v(&__ret, __p0, 33); \
  12816  \
  12817   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12818   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12819   __ret; \
  12820 })
  12821 #endif
  12822 
  /* vld1_u8_x2(__p0): statement expression yielding a uint8x8x2_t.
   * Passes the address of the local result, __p0 and the constant 16 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12823 #ifdef __LITTLE_ENDIAN__
  12824 #define vld1_u8_x2(__p0) __extension__ ({ \
  12825   uint8x8x2_t __ret; \
  12826   __builtin_neon_vld1_x2_v(&__ret, __p0, 16); \
  12827   __ret; \
  12828 })
  12829 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12830 #define vld1_u8_x2(__p0) __extension__ ({ \
  12831   uint8x8x2_t __ret; \
  12832   __builtin_neon_vld1_x2_v(&__ret, __p0, 16); \
  12833  \
  12834   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12835   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12836   __ret; \
  12837 })
  12838 #endif
  12839 
  /* vld1_u32_x2(__p0): statement expression yielding a uint32x2x2_t.
   * Passes the address of the local result, __p0 and the constant 18 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12840 #ifdef __LITTLE_ENDIAN__
  12841 #define vld1_u32_x2(__p0) __extension__ ({ \
  12842   uint32x2x2_t __ret; \
  12843   __builtin_neon_vld1_x2_v(&__ret, __p0, 18); \
  12844   __ret; \
  12845 })
  12846 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  12847 #define vld1_u32_x2(__p0) __extension__ ({ \
  12848   uint32x2x2_t __ret; \
  12849   __builtin_neon_vld1_x2_v(&__ret, __p0, 18); \
  12850  \
  12851   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  12852   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  12853   __ret; \
  12854 })
  12855 #endif
  12856 
  /* vld1_u64_x2(__p0): statement expression yielding a uint64x1x2_t.
   * Passes the address of the local result, __p0 and the constant 19 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * Defined once here, with no __LITTLE_ENDIAN__ split and no lane reversal.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12857 #define vld1_u64_x2(__p0) __extension__ ({ \
  12858   uint64x1x2_t __ret; \
  12859   __builtin_neon_vld1_x2_v(&__ret, __p0, 19); \
  12860   __ret; \
  12861 })
  /* vld1_u16_x2(__p0): statement expression yielding a uint16x4x2_t.
   * Passes the address of the local result, __p0 and the constant 17 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12862 #ifdef __LITTLE_ENDIAN__
  12863 #define vld1_u16_x2(__p0) __extension__ ({ \
  12864   uint16x4x2_t __ret; \
  12865   __builtin_neon_vld1_x2_v(&__ret, __p0, 17); \
  12866   __ret; \
  12867 })
  12868 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12869 #define vld1_u16_x2(__p0) __extension__ ({ \
  12870   uint16x4x2_t __ret; \
  12871   __builtin_neon_vld1_x2_v(&__ret, __p0, 17); \
  12872  \
  12873   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12874   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12875   __ret; \
  12876 })
  12877 #endif
  12878 
  /* vld1_s8_x2(__p0): statement expression yielding an int8x8x2_t.
   * Passes the address of the local result, __p0 and the constant 0 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12879 #ifdef __LITTLE_ENDIAN__
  12880 #define vld1_s8_x2(__p0) __extension__ ({ \
  12881   int8x8x2_t __ret; \
  12882   __builtin_neon_vld1_x2_v(&__ret, __p0, 0); \
  12883   __ret; \
  12884 })
  12885 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12886 #define vld1_s8_x2(__p0) __extension__ ({ \
  12887   int8x8x2_t __ret; \
  12888   __builtin_neon_vld1_x2_v(&__ret, __p0, 0); \
  12889  \
  12890   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12891   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12892   __ret; \
  12893 })
  12894 #endif
  12895 
  /* vld1_f32_x2(__p0): statement expression yielding a float32x2x2_t.
   * Passes the address of the local result, __p0 and the constant 9 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12896 #ifdef __LITTLE_ENDIAN__
  12897 #define vld1_f32_x2(__p0) __extension__ ({ \
  12898   float32x2x2_t __ret; \
  12899   __builtin_neon_vld1_x2_v(&__ret, __p0, 9); \
  12900   __ret; \
  12901 })
  12902 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  12903 #define vld1_f32_x2(__p0) __extension__ ({ \
  12904   float32x2x2_t __ret; \
  12905   __builtin_neon_vld1_x2_v(&__ret, __p0, 9); \
  12906  \
  12907   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  12908   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  12909   __ret; \
  12910 })
  12911 #endif
  12912 
  /* vld1_s32_x2(__p0): statement expression yielding an int32x2x2_t.
   * Passes the address of the local result, __p0 and the constant 2 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12913 #ifdef __LITTLE_ENDIAN__
  12914 #define vld1_s32_x2(__p0) __extension__ ({ \
  12915   int32x2x2_t __ret; \
  12916   __builtin_neon_vld1_x2_v(&__ret, __p0, 2); \
  12917   __ret; \
  12918 })
  12919 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  12920 #define vld1_s32_x2(__p0) __extension__ ({ \
  12921   int32x2x2_t __ret; \
  12922   __builtin_neon_vld1_x2_v(&__ret, __p0, 2); \
  12923  \
  12924   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  12925   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  12926   __ret; \
  12927 })
  12928 #endif
  12929 
  /* vld1_s64_x2(__p0): statement expression yielding an int64x1x2_t.
   * Passes the address of the local result, __p0 and the constant 3 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * Defined once here, with no __LITTLE_ENDIAN__ split and no lane reversal.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12930 #define vld1_s64_x2(__p0) __extension__ ({ \
  12931   int64x1x2_t __ret; \
  12932   __builtin_neon_vld1_x2_v(&__ret, __p0, 3); \
  12933   __ret; \
  12934 })
  /* vld1_s16_x2(__p0): statement expression yielding an int16x4x2_t.
   * Passes the address of the local result, __p0 and the constant 1 to
   * __builtin_neon_vld1_x2_v, then yields the result.
   * NOTE(review): presumably the builtin fills both val[] vectors from memory at
   * __p0 (ACLE vld1_x2 semantics); it is opaque here -- confirm. */
  12935 #ifdef __LITTLE_ENDIAN__
  12936 #define vld1_s16_x2(__p0) __extension__ ({ \
  12937   int16x4x2_t __ret; \
  12938   __builtin_neon_vld1_x2_v(&__ret, __p0, 1); \
  12939   __ret; \
  12940 })
  12941 #else
  /* Without __LITTLE_ENDIAN__: val[0] and val[1] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12942 #define vld1_s16_x2(__p0) __extension__ ({ \
  12943   int16x4x2_t __ret; \
  12944   __builtin_neon_vld1_x2_v(&__ret, __p0, 1); \
  12945  \
  12946   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12947   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12948   __ret; \
  12949 })
  12950 #endif
  12951 
  /* vld1_p8_x3(__p0): statement expression yielding a poly8x8x3_t.
   * Passes the address of the local result, __p0 and the constant 4 to
   * __builtin_neon_vld1_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1_x3 semantics); it is opaque here -- confirm. */
  12952 #ifdef __LITTLE_ENDIAN__
  12953 #define vld1_p8_x3(__p0) __extension__ ({ \
  12954   poly8x8x3_t __ret; \
  12955   __builtin_neon_vld1_x3_v(&__ret, __p0, 4); \
  12956   __ret; \
  12957 })
  12958 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  12959 #define vld1_p8_x3(__p0) __extension__ ({ \
  12960   poly8x8x3_t __ret; \
  12961   __builtin_neon_vld1_x3_v(&__ret, __p0, 4); \
  12962  \
  12963   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  12964   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  12965   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  12966   __ret; \
  12967 })
  12968 #endif
  12969 
  /* vld1_p16_x3(__p0): statement expression yielding a poly16x4x3_t.
   * Passes the address of the local result, __p0 and the constant 5 to
   * __builtin_neon_vld1_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1_x3 semantics); it is opaque here -- confirm. */
  12970 #ifdef __LITTLE_ENDIAN__
  12971 #define vld1_p16_x3(__p0) __extension__ ({ \
  12972   poly16x4x3_t __ret; \
  12973   __builtin_neon_vld1_x3_v(&__ret, __p0, 5); \
  12974   __ret; \
  12975 })
  12976 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  12977 #define vld1_p16_x3(__p0) __extension__ ({ \
  12978   poly16x4x3_t __ret; \
  12979   __builtin_neon_vld1_x3_v(&__ret, __p0, 5); \
  12980  \
  12981   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  12982   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  12983   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  12984   __ret; \
  12985 })
  12986 #endif
  12987 
  /* vld1q_p8_x3(__p0): statement expression yielding a poly8x16x3_t.
   * Passes the address of the local result, __p0 and the constant 36 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  12988 #ifdef __LITTLE_ENDIAN__
  12989 #define vld1q_p8_x3(__p0) __extension__ ({ \
  12990   poly8x16x3_t __ret; \
  12991   __builtin_neon_vld1q_x3_v(&__ret, __p0, 36); \
  12992   __ret; \
  12993 })
  12994 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (15 ... 0) after the builtin call. */
  12995 #define vld1q_p8_x3(__p0) __extension__ ({ \
  12996   poly8x16x3_t __ret; \
  12997   __builtin_neon_vld1q_x3_v(&__ret, __p0, 36); \
  12998  \
  12999   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13000   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13001   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13002   __ret; \
  13003 })
  13004 #endif
  13005 
  /* vld1q_p16_x3(__p0): statement expression yielding a poly16x8x3_t.
   * Passes the address of the local result, __p0 and the constant 37 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  13006 #ifdef __LITTLE_ENDIAN__
  13007 #define vld1q_p16_x3(__p0) __extension__ ({ \
  13008   poly16x8x3_t __ret; \
  13009   __builtin_neon_vld1q_x3_v(&__ret, __p0, 37); \
  13010   __ret; \
  13011 })
  13012 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  13013 #define vld1q_p16_x3(__p0) __extension__ ({ \
  13014   poly16x8x3_t __ret; \
  13015   __builtin_neon_vld1q_x3_v(&__ret, __p0, 37); \
  13016  \
  13017   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13018   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13019   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13020   __ret; \
  13021 })
  13022 #endif
  13023 
  /* vld1q_u8_x3(__p0): statement expression yielding a uint8x16x3_t.
   * Passes the address of the local result, __p0 and the constant 48 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  13024 #ifdef __LITTLE_ENDIAN__
  13025 #define vld1q_u8_x3(__p0) __extension__ ({ \
  13026   uint8x16x3_t __ret; \
  13027   __builtin_neon_vld1q_x3_v(&__ret, __p0, 48); \
  13028   __ret; \
  13029 })
  13030 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (15 ... 0) after the builtin call. */
  13031 #define vld1q_u8_x3(__p0) __extension__ ({ \
  13032   uint8x16x3_t __ret; \
  13033   __builtin_neon_vld1q_x3_v(&__ret, __p0, 48); \
  13034  \
  13035   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13036   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13037   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13038   __ret; \
  13039 })
  13040 #endif
  13041 
  /* vld1q_u32_x3(__p0): statement expression yielding a uint32x4x3_t.
   * Passes the address of the local result, __p0 and the constant 50 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  13042 #ifdef __LITTLE_ENDIAN__
  13043 #define vld1q_u32_x3(__p0) __extension__ ({ \
  13044   uint32x4x3_t __ret; \
  13045   __builtin_neon_vld1q_x3_v(&__ret, __p0, 50); \
  13046   __ret; \
  13047 })
  13048 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (3, 2, 1, 0) after the builtin call. */
  13049 #define vld1q_u32_x3(__p0) __extension__ ({ \
  13050   uint32x4x3_t __ret; \
  13051   __builtin_neon_vld1q_x3_v(&__ret, __p0, 50); \
  13052  \
  13053   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13054   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13055   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13056   __ret; \
  13057 })
  13058 #endif
  13059 
  /* vld1q_u64_x3(__p0): statement expression yielding a uint64x2x3_t.
   * Passes the address of the local result, __p0 and the constant 51 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  13060 #ifdef __LITTLE_ENDIAN__
  13061 #define vld1q_u64_x3(__p0) __extension__ ({ \
  13062   uint64x2x3_t __ret; \
  13063   __builtin_neon_vld1q_x3_v(&__ret, __p0, 51); \
  13064   __ret; \
  13065 })
  13066 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (1, 0) after the builtin call. */
  13067 #define vld1q_u64_x3(__p0) __extension__ ({ \
  13068   uint64x2x3_t __ret; \
  13069   __builtin_neon_vld1q_x3_v(&__ret, __p0, 51); \
  13070  \
  13071   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13072   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13073   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13074   __ret; \
  13075 })
  13076 #endif
  13077 
  /* vld1q_u16_x3(__p0): statement expression yielding a uint16x8x3_t.
   * Passes the address of the local result, __p0 and the constant 49 to
   * __builtin_neon_vld1q_x3_v, then yields the result.
   * NOTE(review): presumably the builtin fills all three val[] vectors from
   * memory at __p0 (ACLE vld1q_x3 semantics); it is opaque here -- confirm. */
  13078 #ifdef __LITTLE_ENDIAN__
  13079 #define vld1q_u16_x3(__p0) __extension__ ({ \
  13080   uint16x8x3_t __ret; \
  13081   __builtin_neon_vld1q_x3_v(&__ret, __p0, 49); \
  13082   __ret; \
  13083 })
  13084 #else
  /* Without __LITTLE_ENDIAN__: val[0], val[1] and val[2] of the result are each
   * lane-reversed (7 ... 0) after the builtin call. */
  13085 #define vld1q_u16_x3(__p0) __extension__ ({ \
  13086   uint16x8x3_t __ret; \
  13087   __builtin_neon_vld1q_x3_v(&__ret, __p0, 49); \
  13088  \
  13089   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13090   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13091   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13092   __ret; \
  13093 })
  13094 #endif
  13095 
  13096 #ifdef __LITTLE_ENDIAN__
  13097 #define vld1q_s8_x3(__p0) __extension__ ({ \
  13098   int8x16x3_t __ret; \
  13099   __builtin_neon_vld1q_x3_v(&__ret, __p0, 32); \
  13100   __ret; \
  13101 })
  13102 #else
  13103 #define vld1q_s8_x3(__p0) __extension__ ({ \
  13104   int8x16x3_t __ret; \
  13105   __builtin_neon_vld1q_x3_v(&__ret, __p0, 32); \
  13106  \
  13107   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13108   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13109   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13110   __ret; \
  13111 })
  13112 #endif
  13113 
  13114 #ifdef __LITTLE_ENDIAN__
  13115 #define vld1q_f32_x3(__p0) __extension__ ({ \
  13116   float32x4x3_t __ret; \
  13117   __builtin_neon_vld1q_x3_v(&__ret, __p0, 41); \
  13118   __ret; \
  13119 })
  13120 #else
  13121 #define vld1q_f32_x3(__p0) __extension__ ({ \
  13122   float32x4x3_t __ret; \
  13123   __builtin_neon_vld1q_x3_v(&__ret, __p0, 41); \
  13124  \
  13125   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13126   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13127   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13128   __ret; \
  13129 })
  13130 #endif
  13131 
  13132 #ifdef __LITTLE_ENDIAN__
  13133 #define vld1q_s32_x3(__p0) __extension__ ({ \
  13134   int32x4x3_t __ret; \
  13135   __builtin_neon_vld1q_x3_v(&__ret, __p0, 34); \
  13136   __ret; \
  13137 })
  13138 #else
  13139 #define vld1q_s32_x3(__p0) __extension__ ({ \
  13140   int32x4x3_t __ret; \
  13141   __builtin_neon_vld1q_x3_v(&__ret, __p0, 34); \
  13142  \
  13143   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13144   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13145   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13146   __ret; \
  13147 })
  13148 #endif
  13149 
  13150 #ifdef __LITTLE_ENDIAN__
  13151 #define vld1q_s64_x3(__p0) __extension__ ({ \
  13152   int64x2x3_t __ret; \
  13153   __builtin_neon_vld1q_x3_v(&__ret, __p0, 35); \
  13154   __ret; \
  13155 })
  13156 #else
  13157 #define vld1q_s64_x3(__p0) __extension__ ({ \
  13158   int64x2x3_t __ret; \
  13159   __builtin_neon_vld1q_x3_v(&__ret, __p0, 35); \
  13160  \
  13161   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13162   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13163   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13164   __ret; \
  13165 })
  13166 #endif
  13167 
  13168 #ifdef __LITTLE_ENDIAN__
  13169 #define vld1q_s16_x3(__p0) __extension__ ({ \
  13170   int16x8x3_t __ret; \
  13171   __builtin_neon_vld1q_x3_v(&__ret, __p0, 33); \
  13172   __ret; \
  13173 })
  13174 #else
  13175 #define vld1q_s16_x3(__p0) __extension__ ({ \
  13176   int16x8x3_t __ret; \
  13177   __builtin_neon_vld1q_x3_v(&__ret, __p0, 33); \
  13178  \
  13179   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13180   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13181   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13182   __ret; \
  13183 })
  13184 #endif
  13185 
  13186 #ifdef __LITTLE_ENDIAN__
  13187 #define vld1_u8_x3(__p0) __extension__ ({ \
  13188   uint8x8x3_t __ret; \
  13189   __builtin_neon_vld1_x3_v(&__ret, __p0, 16); \
  13190   __ret; \
  13191 })
  13192 #else
  13193 #define vld1_u8_x3(__p0) __extension__ ({ \
  13194   uint8x8x3_t __ret; \
  13195   __builtin_neon_vld1_x3_v(&__ret, __p0, 16); \
  13196  \
  13197   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13198   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13199   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13200   __ret; \
  13201 })
  13202 #endif
  13203 
  13204 #ifdef __LITTLE_ENDIAN__
  13205 #define vld1_u32_x3(__p0) __extension__ ({ \
  13206   uint32x2x3_t __ret; \
  13207   __builtin_neon_vld1_x3_v(&__ret, __p0, 18); \
  13208   __ret; \
  13209 })
  13210 #else
  13211 #define vld1_u32_x3(__p0) __extension__ ({ \
  13212   uint32x2x3_t __ret; \
  13213   __builtin_neon_vld1_x3_v(&__ret, __p0, 18); \
  13214  \
  13215   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13216   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13217   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13218   __ret; \
  13219 })
  13220 #endif
  13221 
  13222 #define vld1_u64_x3(__p0) __extension__ ({ \
  13223   uint64x1x3_t __ret; \
  13224   __builtin_neon_vld1_x3_v(&__ret, __p0, 19); \
  13225   __ret; \
  13226 })
  13227 #ifdef __LITTLE_ENDIAN__
  13228 #define vld1_u16_x3(__p0) __extension__ ({ \
  13229   uint16x4x3_t __ret; \
  13230   __builtin_neon_vld1_x3_v(&__ret, __p0, 17); \
  13231   __ret; \
  13232 })
  13233 #else
  13234 #define vld1_u16_x3(__p0) __extension__ ({ \
  13235   uint16x4x3_t __ret; \
  13236   __builtin_neon_vld1_x3_v(&__ret, __p0, 17); \
  13237  \
  13238   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13239   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13240   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13241   __ret; \
  13242 })
  13243 #endif
  13244 
  13245 #ifdef __LITTLE_ENDIAN__
  13246 #define vld1_s8_x3(__p0) __extension__ ({ \
  13247   int8x8x3_t __ret; \
  13248   __builtin_neon_vld1_x3_v(&__ret, __p0, 0); \
  13249   __ret; \
  13250 })
  13251 #else
  13252 #define vld1_s8_x3(__p0) __extension__ ({ \
  13253   int8x8x3_t __ret; \
  13254   __builtin_neon_vld1_x3_v(&__ret, __p0, 0); \
  13255  \
  13256   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13257   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13258   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13259   __ret; \
  13260 })
  13261 #endif
  13262 
  13263 #ifdef __LITTLE_ENDIAN__
  13264 #define vld1_f32_x3(__p0) __extension__ ({ \
  13265   float32x2x3_t __ret; \
  13266   __builtin_neon_vld1_x3_v(&__ret, __p0, 9); \
  13267   __ret; \
  13268 })
  13269 #else
  13270 #define vld1_f32_x3(__p0) __extension__ ({ \
  13271   float32x2x3_t __ret; \
  13272   __builtin_neon_vld1_x3_v(&__ret, __p0, 9); \
  13273  \
  13274   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13275   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13276   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13277   __ret; \
  13278 })
  13279 #endif
  13280 
  13281 #ifdef __LITTLE_ENDIAN__
  13282 #define vld1_s32_x3(__p0) __extension__ ({ \
  13283   int32x2x3_t __ret; \
  13284   __builtin_neon_vld1_x3_v(&__ret, __p0, 2); \
  13285   __ret; \
  13286 })
  13287 #else
  13288 #define vld1_s32_x3(__p0) __extension__ ({ \
  13289   int32x2x3_t __ret; \
  13290   __builtin_neon_vld1_x3_v(&__ret, __p0, 2); \
  13291  \
  13292   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13293   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13294   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13295   __ret; \
  13296 })
  13297 #endif
  13298 
  13299 #define vld1_s64_x3(__p0) __extension__ ({ \
  13300   int64x1x3_t __ret; \
  13301   __builtin_neon_vld1_x3_v(&__ret, __p0, 3); \
  13302   __ret; \
  13303 })
  13304 #ifdef __LITTLE_ENDIAN__
  13305 #define vld1_s16_x3(__p0) __extension__ ({ \
  13306   int16x4x3_t __ret; \
  13307   __builtin_neon_vld1_x3_v(&__ret, __p0, 1); \
  13308   __ret; \
  13309 })
  13310 #else
  13311 #define vld1_s16_x3(__p0) __extension__ ({ \
  13312   int16x4x3_t __ret; \
  13313   __builtin_neon_vld1_x3_v(&__ret, __p0, 1); \
  13314  \
  13315   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13316   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13317   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13318   __ret; \
  13319 })
  13320 #endif
  13321 
  13322 #ifdef __LITTLE_ENDIAN__
  13323 #define vld1_p8_x4(__p0) __extension__ ({ \
  13324   poly8x8x4_t __ret; \
  13325   __builtin_neon_vld1_x4_v(&__ret, __p0, 4); \
  13326   __ret; \
  13327 })
  13328 #else
  13329 #define vld1_p8_x4(__p0) __extension__ ({ \
  13330   poly8x8x4_t __ret; \
  13331   __builtin_neon_vld1_x4_v(&__ret, __p0, 4); \
  13332  \
  13333   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13334   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13335   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13336   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13337   __ret; \
  13338 })
  13339 #endif
  13340 
  13341 #ifdef __LITTLE_ENDIAN__
  13342 #define vld1_p16_x4(__p0) __extension__ ({ \
  13343   poly16x4x4_t __ret; \
  13344   __builtin_neon_vld1_x4_v(&__ret, __p0, 5); \
  13345   __ret; \
  13346 })
  13347 #else
  13348 #define vld1_p16_x4(__p0) __extension__ ({ \
  13349   poly16x4x4_t __ret; \
  13350   __builtin_neon_vld1_x4_v(&__ret, __p0, 5); \
  13351  \
  13352   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13353   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13354   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13355   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13356   __ret; \
  13357 })
  13358 #endif
  13359 
  13360 #ifdef __LITTLE_ENDIAN__
  13361 #define vld1q_p8_x4(__p0) __extension__ ({ \
  13362   poly8x16x4_t __ret; \
  13363   __builtin_neon_vld1q_x4_v(&__ret, __p0, 36); \
  13364   __ret; \
  13365 })
  13366 #else
  13367 #define vld1q_p8_x4(__p0) __extension__ ({ \
  13368   poly8x16x4_t __ret; \
  13369   __builtin_neon_vld1q_x4_v(&__ret, __p0, 36); \
  13370  \
  13371   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13372   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13373   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13374   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13375   __ret; \
  13376 })
  13377 #endif
  13378 
  13379 #ifdef __LITTLE_ENDIAN__
  13380 #define vld1q_p16_x4(__p0) __extension__ ({ \
  13381   poly16x8x4_t __ret; \
  13382   __builtin_neon_vld1q_x4_v(&__ret, __p0, 37); \
  13383   __ret; \
  13384 })
  13385 #else
  13386 #define vld1q_p16_x4(__p0) __extension__ ({ \
  13387   poly16x8x4_t __ret; \
  13388   __builtin_neon_vld1q_x4_v(&__ret, __p0, 37); \
  13389  \
  13390   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13391   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13392   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13393   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13394   __ret; \
  13395 })
  13396 #endif
  13397 
  13398 #ifdef __LITTLE_ENDIAN__
  13399 #define vld1q_u8_x4(__p0) __extension__ ({ \
  13400   uint8x16x4_t __ret; \
  13401   __builtin_neon_vld1q_x4_v(&__ret, __p0, 48); \
  13402   __ret; \
  13403 })
  13404 #else
  13405 #define vld1q_u8_x4(__p0) __extension__ ({ \
  13406   uint8x16x4_t __ret; \
  13407   __builtin_neon_vld1q_x4_v(&__ret, __p0, 48); \
  13408  \
  13409   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13410   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13411   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13412   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13413   __ret; \
  13414 })
  13415 #endif
  13416 
  13417 #ifdef __LITTLE_ENDIAN__
  13418 #define vld1q_u32_x4(__p0) __extension__ ({ \
  13419   uint32x4x4_t __ret; \
  13420   __builtin_neon_vld1q_x4_v(&__ret, __p0, 50); \
  13421   __ret; \
  13422 })
  13423 #else
  13424 #define vld1q_u32_x4(__p0) __extension__ ({ \
  13425   uint32x4x4_t __ret; \
  13426   __builtin_neon_vld1q_x4_v(&__ret, __p0, 50); \
  13427  \
  13428   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13429   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13430   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13431   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13432   __ret; \
  13433 })
  13434 #endif
  13435 
  13436 #ifdef __LITTLE_ENDIAN__
  13437 #define vld1q_u64_x4(__p0) __extension__ ({ \
  13438   uint64x2x4_t __ret; \
  13439   __builtin_neon_vld1q_x4_v(&__ret, __p0, 51); \
  13440   __ret; \
  13441 })
  13442 #else
  13443 #define vld1q_u64_x4(__p0) __extension__ ({ \
  13444   uint64x2x4_t __ret; \
  13445   __builtin_neon_vld1q_x4_v(&__ret, __p0, 51); \
  13446  \
  13447   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13448   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13449   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13450   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  13451   __ret; \
  13452 })
  13453 #endif
  13454 
  13455 #ifdef __LITTLE_ENDIAN__
  13456 #define vld1q_u16_x4(__p0) __extension__ ({ \
  13457   uint16x8x4_t __ret; \
  13458   __builtin_neon_vld1q_x4_v(&__ret, __p0, 49); \
  13459   __ret; \
  13460 })
  13461 #else
  13462 #define vld1q_u16_x4(__p0) __extension__ ({ \
  13463   uint16x8x4_t __ret; \
  13464   __builtin_neon_vld1q_x4_v(&__ret, __p0, 49); \
  13465  \
  13466   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13467   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13468   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13469   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13470   __ret; \
  13471 })
  13472 #endif
  13473 
  13474 #ifdef __LITTLE_ENDIAN__
  13475 #define vld1q_s8_x4(__p0) __extension__ ({ \
  13476   int8x16x4_t __ret; \
  13477   __builtin_neon_vld1q_x4_v(&__ret, __p0, 32); \
  13478   __ret; \
  13479 })
  13480 #else
  13481 #define vld1q_s8_x4(__p0) __extension__ ({ \
  13482   int8x16x4_t __ret; \
  13483   __builtin_neon_vld1q_x4_v(&__ret, __p0, 32); \
  13484  \
  13485   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13486   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13487   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13488   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13489   __ret; \
  13490 })
  13491 #endif
  13492 
  13493 #ifdef __LITTLE_ENDIAN__
  13494 #define vld1q_f32_x4(__p0) __extension__ ({ \
  13495   float32x4x4_t __ret; \
  13496   __builtin_neon_vld1q_x4_v(&__ret, __p0, 41); \
  13497   __ret; \
  13498 })
  13499 #else
  13500 #define vld1q_f32_x4(__p0) __extension__ ({ \
  13501   float32x4x4_t __ret; \
  13502   __builtin_neon_vld1q_x4_v(&__ret, __p0, 41); \
  13503  \
  13504   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13505   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13506   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13507   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13508   __ret; \
  13509 })
  13510 #endif
  13511 
  13512 #ifdef __LITTLE_ENDIAN__
  13513 #define vld1q_s32_x4(__p0) __extension__ ({ \
  13514   int32x4x4_t __ret; \
  13515   __builtin_neon_vld1q_x4_v(&__ret, __p0, 34); \
  13516   __ret; \
  13517 })
  13518 #else
  13519 #define vld1q_s32_x4(__p0) __extension__ ({ \
  13520   int32x4x4_t __ret; \
  13521   __builtin_neon_vld1q_x4_v(&__ret, __p0, 34); \
  13522  \
  13523   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13524   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13525   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13526   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13527   __ret; \
  13528 })
  13529 #endif
  13530 
  13531 #ifdef __LITTLE_ENDIAN__
  13532 #define vld1q_s64_x4(__p0) __extension__ ({ \
  13533   int64x2x4_t __ret; \
  13534   __builtin_neon_vld1q_x4_v(&__ret, __p0, 35); \
  13535   __ret; \
  13536 })
  13537 #else
  13538 #define vld1q_s64_x4(__p0) __extension__ ({ \
  13539   int64x2x4_t __ret; \
  13540   __builtin_neon_vld1q_x4_v(&__ret, __p0, 35); \
  13541  \
  13542   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13543   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13544   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13545   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  13546   __ret; \
  13547 })
  13548 #endif
  13549 
  13550 #ifdef __LITTLE_ENDIAN__
  13551 #define vld1q_s16_x4(__p0) __extension__ ({ \
  13552   int16x8x4_t __ret; \
  13553   __builtin_neon_vld1q_x4_v(&__ret, __p0, 33); \
  13554   __ret; \
  13555 })
  13556 #else
  13557 #define vld1q_s16_x4(__p0) __extension__ ({ \
  13558   int16x8x4_t __ret; \
  13559   __builtin_neon_vld1q_x4_v(&__ret, __p0, 33); \
  13560  \
  13561   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13562   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13563   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13564   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13565   __ret; \
  13566 })
  13567 #endif
  13568 
  13569 #ifdef __LITTLE_ENDIAN__
  13570 #define vld1_u8_x4(__p0) __extension__ ({ \
  13571   uint8x8x4_t __ret; \
  13572   __builtin_neon_vld1_x4_v(&__ret, __p0, 16); \
  13573   __ret; \
  13574 })
  13575 #else
  13576 #define vld1_u8_x4(__p0) __extension__ ({ \
  13577   uint8x8x4_t __ret; \
  13578   __builtin_neon_vld1_x4_v(&__ret, __p0, 16); \
  13579  \
  13580   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13581   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13582   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13583   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13584   __ret; \
  13585 })
  13586 #endif
  13587 
  13588 #ifdef __LITTLE_ENDIAN__
  13589 #define vld1_u32_x4(__p0) __extension__ ({ \
  13590   uint32x2x4_t __ret; \
  13591   __builtin_neon_vld1_x4_v(&__ret, __p0, 18); \
  13592   __ret; \
  13593 })
  13594 #else
  13595 #define vld1_u32_x4(__p0) __extension__ ({ \
  13596   uint32x2x4_t __ret; \
  13597   __builtin_neon_vld1_x4_v(&__ret, __p0, 18); \
  13598  \
  13599   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13600   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13601   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13602   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  13603   __ret; \
  13604 })
  13605 #endif
  13606 
  13607 #define vld1_u64_x4(__p0) __extension__ ({ \
  13608   uint64x1x4_t __ret; \
  13609   __builtin_neon_vld1_x4_v(&__ret, __p0, 19); \
  13610   __ret; \
  13611 })
  13612 #ifdef __LITTLE_ENDIAN__
  13613 #define vld1_u16_x4(__p0) __extension__ ({ \
  13614   uint16x4x4_t __ret; \
  13615   __builtin_neon_vld1_x4_v(&__ret, __p0, 17); \
  13616   __ret; \
  13617 })
  13618 #else
  13619 #define vld1_u16_x4(__p0) __extension__ ({ \
  13620   uint16x4x4_t __ret; \
  13621   __builtin_neon_vld1_x4_v(&__ret, __p0, 17); \
  13622  \
  13623   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13624   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13625   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13626   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13627   __ret; \
  13628 })
  13629 #endif
  13630 
  13631 #ifdef __LITTLE_ENDIAN__
  13632 #define vld1_s8_x4(__p0) __extension__ ({ \
  13633   int8x8x4_t __ret; \
  13634   __builtin_neon_vld1_x4_v(&__ret, __p0, 0); \
  13635   __ret; \
  13636 })
  13637 #else
  13638 #define vld1_s8_x4(__p0) __extension__ ({ \
  13639   int8x8x4_t __ret; \
  13640   __builtin_neon_vld1_x4_v(&__ret, __p0, 0); \
  13641  \
  13642   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13643   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13644   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  13645   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  13646   __ret; \
  13647 })
  13648 #endif
  13649 
  13650 #ifdef __LITTLE_ENDIAN__
  13651 #define vld1_f32_x4(__p0) __extension__ ({ \
  13652   float32x2x4_t __ret; \
  13653   __builtin_neon_vld1_x4_v(&__ret, __p0, 9); \
  13654   __ret; \
  13655 })
  13656 #else
  13657 #define vld1_f32_x4(__p0) __extension__ ({ \
  13658   float32x2x4_t __ret; \
  13659   __builtin_neon_vld1_x4_v(&__ret, __p0, 9); \
  13660  \
  13661   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13662   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13663   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13664   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  13665   __ret; \
  13666 })
  13667 #endif
  13668 
  13669 #ifdef __LITTLE_ENDIAN__
  13670 #define vld1_s32_x4(__p0) __extension__ ({ \
  13671   int32x2x4_t __ret; \
  13672   __builtin_neon_vld1_x4_v(&__ret, __p0, 2); \
  13673   __ret; \
  13674 })
  13675 #else
  13676 #define vld1_s32_x4(__p0) __extension__ ({ \
  13677   int32x2x4_t __ret; \
  13678   __builtin_neon_vld1_x4_v(&__ret, __p0, 2); \
  13679  \
  13680   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13681   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13682   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  13683   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  13684   __ret; \
  13685 })
  13686 #endif
  13687 
  13688 #define vld1_s64_x4(__p0) __extension__ ({ \
  13689   int64x1x4_t __ret; \
  13690   __builtin_neon_vld1_x4_v(&__ret, __p0, 3); \
  13691   __ret; \
  13692 })
  13693 #ifdef __LITTLE_ENDIAN__
  13694 #define vld1_s16_x4(__p0) __extension__ ({ \
  13695   int16x4x4_t __ret; \
  13696   __builtin_neon_vld1_x4_v(&__ret, __p0, 1); \
  13697   __ret; \
  13698 })
  13699 #else
  13700 #define vld1_s16_x4(__p0) __extension__ ({ \
  13701   int16x4x4_t __ret; \
  13702   __builtin_neon_vld1_x4_v(&__ret, __p0, 1); \
  13703  \
  13704   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13705   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13706   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  13707   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  13708   __ret; \
  13709 })
  13710 #endif
  13711 
  13712 #ifdef __LITTLE_ENDIAN__
  13713 #define vld2_p8(__p0) __extension__ ({ \
  13714   poly8x8x2_t __ret; \
  13715   __builtin_neon_vld2_v(&__ret, __p0, 4); \
  13716   __ret; \
  13717 })
  13718 #else
  13719 #define vld2_p8(__p0) __extension__ ({ \
  13720   poly8x8x2_t __ret; \
  13721   __builtin_neon_vld2_v(&__ret, __p0, 4); \
  13722  \
  13723   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13724   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13725   __ret; \
  13726 })
  13727 #endif
  13728 
  13729 #ifdef __LITTLE_ENDIAN__
  13730 #define vld2_p16(__p0) __extension__ ({ \
  13731   poly16x4x2_t __ret; \
  13732   __builtin_neon_vld2_v(&__ret, __p0, 5); \
  13733   __ret; \
  13734 })
  13735 #else
  13736 #define vld2_p16(__p0) __extension__ ({ \
  13737   poly16x4x2_t __ret; \
  13738   __builtin_neon_vld2_v(&__ret, __p0, 5); \
  13739  \
  13740   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13741   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13742   __ret; \
  13743 })
  13744 #endif
  13745 
  13746 #ifdef __LITTLE_ENDIAN__
  13747 #define vld2q_p8(__p0) __extension__ ({ \
  13748   poly8x16x2_t __ret; \
  13749   __builtin_neon_vld2q_v(&__ret, __p0, 36); \
  13750   __ret; \
  13751 })
  13752 #else
  13753 #define vld2q_p8(__p0) __extension__ ({ \
  13754   poly8x16x2_t __ret; \
  13755   __builtin_neon_vld2q_v(&__ret, __p0, 36); \
  13756  \
  13757   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13758   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13759   __ret; \
  13760 })
  13761 #endif
  13762 
  13763 #ifdef __LITTLE_ENDIAN__
  13764 #define vld2q_p16(__p0) __extension__ ({ \
  13765   poly16x8x2_t __ret; \
  13766   __builtin_neon_vld2q_v(&__ret, __p0, 37); \
  13767   __ret; \
  13768 })
  13769 #else
  13770 #define vld2q_p16(__p0) __extension__ ({ \
  13771   poly16x8x2_t __ret; \
  13772   __builtin_neon_vld2q_v(&__ret, __p0, 37); \
  13773  \
  13774   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13775   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13776   __ret; \
  13777 })
  13778 #endif
  13779 
  13780 #ifdef __LITTLE_ENDIAN__
  13781 #define vld2q_u8(__p0) __extension__ ({ \
  13782   uint8x16x2_t __ret; \
  13783   __builtin_neon_vld2q_v(&__ret, __p0, 48); \
  13784   __ret; \
  13785 })
  13786 #else
  13787 #define vld2q_u8(__p0) __extension__ ({ \
  13788   uint8x16x2_t __ret; \
  13789   __builtin_neon_vld2q_v(&__ret, __p0, 48); \
  13790  \
  13791   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13792   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13793   __ret; \
  13794 })
  13795 #endif
  13796 
  13797 #ifdef __LITTLE_ENDIAN__
  13798 #define vld2q_u32(__p0) __extension__ ({ \
  13799   uint32x4x2_t __ret; \
  13800   __builtin_neon_vld2q_v(&__ret, __p0, 50); \
  13801   __ret; \
  13802 })
  13803 #else
  13804 #define vld2q_u32(__p0) __extension__ ({ \
  13805   uint32x4x2_t __ret; \
  13806   __builtin_neon_vld2q_v(&__ret, __p0, 50); \
  13807  \
  13808   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13809   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13810   __ret; \
  13811 })
  13812 #endif
  13813 
  13814 #ifdef __LITTLE_ENDIAN__
  13815 #define vld2q_u16(__p0) __extension__ ({ \
  13816   uint16x8x2_t __ret; \
  13817   __builtin_neon_vld2q_v(&__ret, __p0, 49); \
  13818   __ret; \
  13819 })
  13820 #else
  13821 #define vld2q_u16(__p0) __extension__ ({ \
  13822   uint16x8x2_t __ret; \
  13823   __builtin_neon_vld2q_v(&__ret, __p0, 49); \
  13824  \
  13825   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13826   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13827   __ret; \
  13828 })
  13829 #endif
  13830 
  13831 #ifdef __LITTLE_ENDIAN__
  13832 #define vld2q_s8(__p0) __extension__ ({ \
  13833   int8x16x2_t __ret; \
  13834   __builtin_neon_vld2q_v(&__ret, __p0, 32); \
  13835   __ret; \
  13836 })
  13837 #else
  13838 #define vld2q_s8(__p0) __extension__ ({ \
  13839   int8x16x2_t __ret; \
  13840   __builtin_neon_vld2q_v(&__ret, __p0, 32); \
  13841  \
  13842   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13843   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  13844   __ret; \
  13845 })
  13846 #endif
  13847 
  13848 #ifdef __LITTLE_ENDIAN__
  13849 #define vld2q_f32(__p0) __extension__ ({ \
  13850   float32x4x2_t __ret; \
  13851   __builtin_neon_vld2q_v(&__ret, __p0, 41); \
  13852   __ret; \
  13853 })
  13854 #else
  13855 #define vld2q_f32(__p0) __extension__ ({ \
  13856   float32x4x2_t __ret; \
  13857   __builtin_neon_vld2q_v(&__ret, __p0, 41); \
  13858  \
  13859   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13860   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13861   __ret; \
  13862 })
  13863 #endif
  13864 
  /* vld2q_s32(__p0): yields an int32x4x2_t filled by
   * __builtin_neon_vld2q_v(&__ret, __p0, 34). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 34 is presumably the builtin's type code -- confirm. */
  13865 #ifdef __LITTLE_ENDIAN__
  13866 #define vld2q_s32(__p0) __extension__ ({ \
  13867   int32x4x2_t __ret; \
  13868   __builtin_neon_vld2q_v(&__ret, __p0, 34); \
  13869   __ret; \
  13870 })
  13871 #else
  13872 #define vld2q_s32(__p0) __extension__ ({ \
  13873   int32x4x2_t __ret; \
  13874   __builtin_neon_vld2q_v(&__ret, __p0, 34); \
  13875  \
  13876   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13877   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13878   __ret; \
  13879 })
  13880 #endif
  13881 
  /* vld2q_s16(__p0): yields an int16x8x2_t filled by
   * __builtin_neon_vld2q_v(&__ret, __p0, 33). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 33 is presumably the builtin's type code -- confirm. */
  13882 #ifdef __LITTLE_ENDIAN__
  13883 #define vld2q_s16(__p0) __extension__ ({ \
  13884   int16x8x2_t __ret; \
  13885   __builtin_neon_vld2q_v(&__ret, __p0, 33); \
  13886   __ret; \
  13887 })
  13888 #else
  13889 #define vld2q_s16(__p0) __extension__ ({ \
  13890   int16x8x2_t __ret; \
  13891   __builtin_neon_vld2q_v(&__ret, __p0, 33); \
  13892  \
  13893   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13894   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13895   __ret; \
  13896 })
  13897 #endif
  13898 
  /* vld2_u8(__p0): yields a uint8x8x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 16). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 16 is presumably the builtin's type code -- confirm. */
  13899 #ifdef __LITTLE_ENDIAN__
  13900 #define vld2_u8(__p0) __extension__ ({ \
  13901   uint8x8x2_t __ret; \
  13902   __builtin_neon_vld2_v(&__ret, __p0, 16); \
  13903   __ret; \
  13904 })
  13905 #else
  13906 #define vld2_u8(__p0) __extension__ ({ \
  13907   uint8x8x2_t __ret; \
  13908   __builtin_neon_vld2_v(&__ret, __p0, 16); \
  13909  \
  13910   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13911   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13912   __ret; \
  13913 })
  13914 #endif
  13915 
  /* vld2_u32(__p0): yields a uint32x2x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 18). Without __LITTLE_ENDIAN__ the
   * two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 18 is presumably the builtin's type code -- confirm. */
  13916 #ifdef __LITTLE_ENDIAN__
  13917 #define vld2_u32(__p0) __extension__ ({ \
  13918   uint32x2x2_t __ret; \
  13919   __builtin_neon_vld2_v(&__ret, __p0, 18); \
  13920   __ret; \
  13921 })
  13922 #else
  13923 #define vld2_u32(__p0) __extension__ ({ \
  13924   uint32x2x2_t __ret; \
  13925   __builtin_neon_vld2_v(&__ret, __p0, 18); \
  13926  \
  13927   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13928   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13929   __ret; \
  13930 })
  13931 #endif
  13932 
  /* vld2_u64(__p0): yields a uint64x1x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 19). Unlike the surrounding macros
   * it has no __LITTLE_ENDIAN__/#else split and performs no lane reversal
   * (presumably because each vector holds a single lane -- confirm).
   * NOTE(review): 19 is presumably the builtin's type code -- confirm. */
  13933 #define vld2_u64(__p0) __extension__ ({ \
  13934   uint64x1x2_t __ret; \
  13935   __builtin_neon_vld2_v(&__ret, __p0, 19); \
  13936   __ret; \
  13937 })
  /* vld2_u16(__p0): yields a uint16x4x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 17). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 17 is presumably the builtin's type code -- confirm. */
  13938 #ifdef __LITTLE_ENDIAN__
  13939 #define vld2_u16(__p0) __extension__ ({ \
  13940   uint16x4x2_t __ret; \
  13941   __builtin_neon_vld2_v(&__ret, __p0, 17); \
  13942   __ret; \
  13943 })
  13944 #else
  13945 #define vld2_u16(__p0) __extension__ ({ \
  13946   uint16x4x2_t __ret; \
  13947   __builtin_neon_vld2_v(&__ret, __p0, 17); \
  13948  \
  13949   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  13950   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  13951   __ret; \
  13952 })
  13953 #endif
  13954 
  /* vld2_s8(__p0): yields an int8x8x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 0). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 0 is presumably the builtin's type code -- confirm. */
  13955 #ifdef __LITTLE_ENDIAN__
  13956 #define vld2_s8(__p0) __extension__ ({ \
  13957   int8x8x2_t __ret; \
  13958   __builtin_neon_vld2_v(&__ret, __p0, 0); \
  13959   __ret; \
  13960 })
  13961 #else
  13962 #define vld2_s8(__p0) __extension__ ({ \
  13963   int8x8x2_t __ret; \
  13964   __builtin_neon_vld2_v(&__ret, __p0, 0); \
  13965  \
  13966   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  13967   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  13968   __ret; \
  13969 })
  13970 #endif
  13971 
  /* vld2_f32(__p0): yields a float32x2x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 9). Without __LITTLE_ENDIAN__ the
   * two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 9 is presumably the builtin's type code -- confirm. */
  13972 #ifdef __LITTLE_ENDIAN__
  13973 #define vld2_f32(__p0) __extension__ ({ \
  13974   float32x2x2_t __ret; \
  13975   __builtin_neon_vld2_v(&__ret, __p0, 9); \
  13976   __ret; \
  13977 })
  13978 #else
  13979 #define vld2_f32(__p0) __extension__ ({ \
  13980   float32x2x2_t __ret; \
  13981   __builtin_neon_vld2_v(&__ret, __p0, 9); \
  13982  \
  13983   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  13984   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  13985   __ret; \
  13986 })
  13987 #endif
  13988 
  /* vld2_s32(__p0): yields an int32x2x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 2). Without __LITTLE_ENDIAN__ the
   * two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 2 is presumably the builtin's type code -- confirm. */
  13989 #ifdef __LITTLE_ENDIAN__
  13990 #define vld2_s32(__p0) __extension__ ({ \
  13991   int32x2x2_t __ret; \
  13992   __builtin_neon_vld2_v(&__ret, __p0, 2); \
  13993   __ret; \
  13994 })
  13995 #else
  13996 #define vld2_s32(__p0) __extension__ ({ \
  13997   int32x2x2_t __ret; \
  13998   __builtin_neon_vld2_v(&__ret, __p0, 2); \
  13999  \
  14000   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14001   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14002   __ret; \
  14003 })
  14004 #endif
  14005 
  /* vld2_s64(__p0): yields an int64x1x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 3). Unlike the surrounding macros
   * it has no __LITTLE_ENDIAN__/#else split and performs no lane reversal
   * (presumably because each vector holds a single lane -- confirm).
   * NOTE(review): 3 is presumably the builtin's type code -- confirm. */
  14006 #define vld2_s64(__p0) __extension__ ({ \
  14007   int64x1x2_t __ret; \
  14008   __builtin_neon_vld2_v(&__ret, __p0, 3); \
  14009   __ret; \
  14010 })
  /* vld2_s16(__p0): yields an int16x4x2_t filled by
   * __builtin_neon_vld2_v(&__ret, __p0, 1). Without __LITTLE_ENDIAN__ the
   * lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 1 is presumably the builtin's type code -- confirm. */
  14011 #ifdef __LITTLE_ENDIAN__
  14012 #define vld2_s16(__p0) __extension__ ({ \
  14013   int16x4x2_t __ret; \
  14014   __builtin_neon_vld2_v(&__ret, __p0, 1); \
  14015   __ret; \
  14016 })
  14017 #else
  14018 #define vld2_s16(__p0) __extension__ ({ \
  14019   int16x4x2_t __ret; \
  14020   __builtin_neon_vld2_v(&__ret, __p0, 1); \
  14021  \
  14022   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14023   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14024   __ret; \
  14025 })
  14026 #endif
  14027 
  /* vld2_dup_p8(__p0): yields a poly8x8x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 4). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 4 is presumably the builtin's type code -- confirm. */
  14028 #ifdef __LITTLE_ENDIAN__
  14029 #define vld2_dup_p8(__p0) __extension__ ({ \
  14030   poly8x8x2_t __ret; \
  14031   __builtin_neon_vld2_dup_v(&__ret, __p0, 4); \
  14032   __ret; \
  14033 })
  14034 #else
  14035 #define vld2_dup_p8(__p0) __extension__ ({ \
  14036   poly8x8x2_t __ret; \
  14037   __builtin_neon_vld2_dup_v(&__ret, __p0, 4); \
  14038  \
  14039   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14040   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14041   __ret; \
  14042 })
  14043 #endif
  14044 
  /* vld2_dup_p16(__p0): yields a poly16x4x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 5). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 5 is presumably the builtin's type code -- confirm. */
  14045 #ifdef __LITTLE_ENDIAN__
  14046 #define vld2_dup_p16(__p0) __extension__ ({ \
  14047   poly16x4x2_t __ret; \
  14048   __builtin_neon_vld2_dup_v(&__ret, __p0, 5); \
  14049   __ret; \
  14050 })
  14051 #else
  14052 #define vld2_dup_p16(__p0) __extension__ ({ \
  14053   poly16x4x2_t __ret; \
  14054   __builtin_neon_vld2_dup_v(&__ret, __p0, 5); \
  14055  \
  14056   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14057   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14058   __ret; \
  14059 })
  14060 #endif
  14061 
  /* vld2q_dup_p8(__p0): yields a poly8x16x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 36). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 36 is presumably the builtin's type code -- confirm. */
  14062 #ifdef __LITTLE_ENDIAN__
  14063 #define vld2q_dup_p8(__p0) __extension__ ({ \
  14064   poly8x16x2_t __ret; \
  14065   __builtin_neon_vld2q_dup_v(&__ret, __p0, 36); \
  14066   __ret; \
  14067 })
  14068 #else
  14069 #define vld2q_dup_p8(__p0) __extension__ ({ \
  14070   poly8x16x2_t __ret; \
  14071   __builtin_neon_vld2q_dup_v(&__ret, __p0, 36); \
  14072  \
  14073   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14074   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14075   __ret; \
  14076 })
  14077 #endif
  14078 
  /* vld2q_dup_p16(__p0): yields a poly16x8x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 37). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 37 is presumably the builtin's type code -- confirm. */
  14079 #ifdef __LITTLE_ENDIAN__
  14080 #define vld2q_dup_p16(__p0) __extension__ ({ \
  14081   poly16x8x2_t __ret; \
  14082   __builtin_neon_vld2q_dup_v(&__ret, __p0, 37); \
  14083   __ret; \
  14084 })
  14085 #else
  14086 #define vld2q_dup_p16(__p0) __extension__ ({ \
  14087   poly16x8x2_t __ret; \
  14088   __builtin_neon_vld2q_dup_v(&__ret, __p0, 37); \
  14089  \
  14090   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14091   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14092   __ret; \
  14093 })
  14094 #endif
  14095 
  /* vld2q_dup_u8(__p0): yields a uint8x16x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 48). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 48 is presumably the builtin's type code -- confirm. */
  14096 #ifdef __LITTLE_ENDIAN__
  14097 #define vld2q_dup_u8(__p0) __extension__ ({ \
  14098   uint8x16x2_t __ret; \
  14099   __builtin_neon_vld2q_dup_v(&__ret, __p0, 48); \
  14100   __ret; \
  14101 })
  14102 #else
  14103 #define vld2q_dup_u8(__p0) __extension__ ({ \
  14104   uint8x16x2_t __ret; \
  14105   __builtin_neon_vld2q_dup_v(&__ret, __p0, 48); \
  14106  \
  14107   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14108   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14109   __ret; \
  14110 })
  14111 #endif
  14112 
  /* vld2q_dup_u32(__p0): yields a uint32x4x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 50). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 50 is presumably the builtin's type code -- confirm. */
  14113 #ifdef __LITTLE_ENDIAN__
  14114 #define vld2q_dup_u32(__p0) __extension__ ({ \
  14115   uint32x4x2_t __ret; \
  14116   __builtin_neon_vld2q_dup_v(&__ret, __p0, 50); \
  14117   __ret; \
  14118 })
  14119 #else
  14120 #define vld2q_dup_u32(__p0) __extension__ ({ \
  14121   uint32x4x2_t __ret; \
  14122   __builtin_neon_vld2q_dup_v(&__ret, __p0, 50); \
  14123  \
  14124   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14125   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14126   __ret; \
  14127 })
  14128 #endif
  14129 
  /* vld2q_dup_u64(__p0): yields a uint64x2x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 51). Without __LITTLE_ENDIAN__
   * the two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 51 is presumably the builtin's type code -- confirm. */
  14130 #ifdef __LITTLE_ENDIAN__
  14131 #define vld2q_dup_u64(__p0) __extension__ ({ \
  14132   uint64x2x2_t __ret; \
  14133   __builtin_neon_vld2q_dup_v(&__ret, __p0, 51); \
  14134   __ret; \
  14135 })
  14136 #else
  14137 #define vld2q_dup_u64(__p0) __extension__ ({ \
  14138   uint64x2x2_t __ret; \
  14139   __builtin_neon_vld2q_dup_v(&__ret, __p0, 51); \
  14140  \
  14141   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14142   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14143   __ret; \
  14144 })
  14145 #endif
  14146 
  /* vld2q_dup_u16(__p0): yields a uint16x8x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 49). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 49 is presumably the builtin's type code -- confirm. */
  14147 #ifdef __LITTLE_ENDIAN__
  14148 #define vld2q_dup_u16(__p0) __extension__ ({ \
  14149   uint16x8x2_t __ret; \
  14150   __builtin_neon_vld2q_dup_v(&__ret, __p0, 49); \
  14151   __ret; \
  14152 })
  14153 #else
  14154 #define vld2q_dup_u16(__p0) __extension__ ({ \
  14155   uint16x8x2_t __ret; \
  14156   __builtin_neon_vld2q_dup_v(&__ret, __p0, 49); \
  14157  \
  14158   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14159   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14160   __ret; \
  14161 })
  14162 #endif
  14163 
  /* vld2q_dup_s8(__p0): yields an int8x16x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 32). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 32 is presumably the builtin's type code -- confirm. */
  14164 #ifdef __LITTLE_ENDIAN__
  14165 #define vld2q_dup_s8(__p0) __extension__ ({ \
  14166   int8x16x2_t __ret; \
  14167   __builtin_neon_vld2q_dup_v(&__ret, __p0, 32); \
  14168   __ret; \
  14169 })
  14170 #else
  14171 #define vld2q_dup_s8(__p0) __extension__ ({ \
  14172   int8x16x2_t __ret; \
  14173   __builtin_neon_vld2q_dup_v(&__ret, __p0, 32); \
  14174  \
  14175   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14176   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14177   __ret; \
  14178 })
  14179 #endif
  14180 
  /* vld2q_dup_f32(__p0): yields a float32x4x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 41). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 41 is presumably the builtin's type code -- confirm. */
  14181 #ifdef __LITTLE_ENDIAN__
  14182 #define vld2q_dup_f32(__p0) __extension__ ({ \
  14183   float32x4x2_t __ret; \
  14184   __builtin_neon_vld2q_dup_v(&__ret, __p0, 41); \
  14185   __ret; \
  14186 })
  14187 #else
  14188 #define vld2q_dup_f32(__p0) __extension__ ({ \
  14189   float32x4x2_t __ret; \
  14190   __builtin_neon_vld2q_dup_v(&__ret, __p0, 41); \
  14191  \
  14192   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14193   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14194   __ret; \
  14195 })
  14196 #endif
  14197 
  /* vld2q_dup_s32(__p0): yields an int32x4x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 34). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 34 is presumably the builtin's type code -- confirm. */
  14198 #ifdef __LITTLE_ENDIAN__
  14199 #define vld2q_dup_s32(__p0) __extension__ ({ \
  14200   int32x4x2_t __ret; \
  14201   __builtin_neon_vld2q_dup_v(&__ret, __p0, 34); \
  14202   __ret; \
  14203 })
  14204 #else
  14205 #define vld2q_dup_s32(__p0) __extension__ ({ \
  14206   int32x4x2_t __ret; \
  14207   __builtin_neon_vld2q_dup_v(&__ret, __p0, 34); \
  14208  \
  14209   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14210   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14211   __ret; \
  14212 })
  14213 #endif
  14214 
  /* vld2q_dup_s64(__p0): yields an int64x2x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 35). Without __LITTLE_ENDIAN__
   * the two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 35 is presumably the builtin's type code -- confirm. */
  14215 #ifdef __LITTLE_ENDIAN__
  14216 #define vld2q_dup_s64(__p0) __extension__ ({ \
  14217   int64x2x2_t __ret; \
  14218   __builtin_neon_vld2q_dup_v(&__ret, __p0, 35); \
  14219   __ret; \
  14220 })
  14221 #else
  14222 #define vld2q_dup_s64(__p0) __extension__ ({ \
  14223   int64x2x2_t __ret; \
  14224   __builtin_neon_vld2q_dup_v(&__ret, __p0, 35); \
  14225  \
  14226   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14227   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14228   __ret; \
  14229 })
  14230 #endif
  14231 
  /* vld2q_dup_s16(__p0): yields an int16x8x2_t filled by
   * __builtin_neon_vld2q_dup_v(&__ret, __p0, 33). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 33 is presumably the builtin's type code -- confirm. */
  14232 #ifdef __LITTLE_ENDIAN__
  14233 #define vld2q_dup_s16(__p0) __extension__ ({ \
  14234   int16x8x2_t __ret; \
  14235   __builtin_neon_vld2q_dup_v(&__ret, __p0, 33); \
  14236   __ret; \
  14237 })
  14238 #else
  14239 #define vld2q_dup_s16(__p0) __extension__ ({ \
  14240   int16x8x2_t __ret; \
  14241   __builtin_neon_vld2q_dup_v(&__ret, __p0, 33); \
  14242  \
  14243   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14244   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14245   __ret; \
  14246 })
  14247 #endif
  14248 
  /* vld2_dup_u8(__p0): yields a uint8x8x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 16). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 16 is presumably the builtin's type code -- confirm. */
  14249 #ifdef __LITTLE_ENDIAN__
  14250 #define vld2_dup_u8(__p0) __extension__ ({ \
  14251   uint8x8x2_t __ret; \
  14252   __builtin_neon_vld2_dup_v(&__ret, __p0, 16); \
  14253   __ret; \
  14254 })
  14255 #else
  14256 #define vld2_dup_u8(__p0) __extension__ ({ \
  14257   uint8x8x2_t __ret; \
  14258   __builtin_neon_vld2_dup_v(&__ret, __p0, 16); \
  14259  \
  14260   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14261   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14262   __ret; \
  14263 })
  14264 #endif
  14265 
  /* vld2_dup_u32(__p0): yields a uint32x2x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 18). Without __LITTLE_ENDIAN__
   * the two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 18 is presumably the builtin's type code -- confirm. */
  14266 #ifdef __LITTLE_ENDIAN__
  14267 #define vld2_dup_u32(__p0) __extension__ ({ \
  14268   uint32x2x2_t __ret; \
  14269   __builtin_neon_vld2_dup_v(&__ret, __p0, 18); \
  14270   __ret; \
  14271 })
  14272 #else
  14273 #define vld2_dup_u32(__p0) __extension__ ({ \
  14274   uint32x2x2_t __ret; \
  14275   __builtin_neon_vld2_dup_v(&__ret, __p0, 18); \
  14276  \
  14277   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14278   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14279   __ret; \
  14280 })
  14281 #endif
  14282 
  /* vld2_dup_u64(__p0): yields a uint64x1x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 19). Unlike the surrounding
   * macros it has no __LITTLE_ENDIAN__/#else split and performs no lane
   * reversal (presumably because each vector holds one lane -- confirm).
   * NOTE(review): 19 is presumably the builtin's type code -- confirm. */
  14283 #define vld2_dup_u64(__p0) __extension__ ({ \
  14284   uint64x1x2_t __ret; \
  14285   __builtin_neon_vld2_dup_v(&__ret, __p0, 19); \
  14286   __ret; \
  14287 })
  /* vld2_dup_u16(__p0): yields a uint16x4x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 17). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 17 is presumably the builtin's type code -- confirm. */
  14288 #ifdef __LITTLE_ENDIAN__
  14289 #define vld2_dup_u16(__p0) __extension__ ({ \
  14290   uint16x4x2_t __ret; \
  14291   __builtin_neon_vld2_dup_v(&__ret, __p0, 17); \
  14292   __ret; \
  14293 })
  14294 #else
  14295 #define vld2_dup_u16(__p0) __extension__ ({ \
  14296   uint16x4x2_t __ret; \
  14297   __builtin_neon_vld2_dup_v(&__ret, __p0, 17); \
  14298  \
  14299   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14300   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14301   __ret; \
  14302 })
  14303 #endif
  14304 
  /* vld2_dup_s8(__p0): yields an int8x8x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 0). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 0 is presumably the builtin's type code -- confirm. */
  14305 #ifdef __LITTLE_ENDIAN__
  14306 #define vld2_dup_s8(__p0) __extension__ ({ \
  14307   int8x8x2_t __ret; \
  14308   __builtin_neon_vld2_dup_v(&__ret, __p0, 0); \
  14309   __ret; \
  14310 })
  14311 #else
  14312 #define vld2_dup_s8(__p0) __extension__ ({ \
  14313   int8x8x2_t __ret; \
  14314   __builtin_neon_vld2_dup_v(&__ret, __p0, 0); \
  14315  \
  14316   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14317   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14318   __ret; \
  14319 })
  14320 #endif
  14321 
  /* vld2_dup_f32(__p0): yields a float32x2x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 9). Without __LITTLE_ENDIAN__
   * the two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 9 is presumably the builtin's type code -- confirm. */
  14322 #ifdef __LITTLE_ENDIAN__
  14323 #define vld2_dup_f32(__p0) __extension__ ({ \
  14324   float32x2x2_t __ret; \
  14325   __builtin_neon_vld2_dup_v(&__ret, __p0, 9); \
  14326   __ret; \
  14327 })
  14328 #else
  14329 #define vld2_dup_f32(__p0) __extension__ ({ \
  14330   float32x2x2_t __ret; \
  14331   __builtin_neon_vld2_dup_v(&__ret, __p0, 9); \
  14332  \
  14333   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14334   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14335   __ret; \
  14336 })
  14337 #endif
  14338 
  /* vld2_dup_s32(__p0): yields an int32x2x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 2). Without __LITTLE_ENDIAN__
   * the two lanes of val[0] and of val[1] are swapped after the builtin call.
   * NOTE(review): 2 is presumably the builtin's type code -- confirm. */
  14339 #ifdef __LITTLE_ENDIAN__
  14340 #define vld2_dup_s32(__p0) __extension__ ({ \
  14341   int32x2x2_t __ret; \
  14342   __builtin_neon_vld2_dup_v(&__ret, __p0, 2); \
  14343   __ret; \
  14344 })
  14345 #else
  14346 #define vld2_dup_s32(__p0) __extension__ ({ \
  14347   int32x2x2_t __ret; \
  14348   __builtin_neon_vld2_dup_v(&__ret, __p0, 2); \
  14349  \
  14350   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14351   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14352   __ret; \
  14353 })
  14354 #endif
  14355 
  /* vld2_dup_s64(__p0): yields an int64x1x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 3). Unlike the surrounding
   * macros it has no __LITTLE_ENDIAN__/#else split and performs no lane
   * reversal (presumably because each vector holds one lane -- confirm).
   * NOTE(review): 3 is presumably the builtin's type code -- confirm. */
  14356 #define vld2_dup_s64(__p0) __extension__ ({ \
  14357   int64x1x2_t __ret; \
  14358   __builtin_neon_vld2_dup_v(&__ret, __p0, 3); \
  14359   __ret; \
  14360 })
  /* vld2_dup_s16(__p0): yields an int16x4x2_t filled by
   * __builtin_neon_vld2_dup_v(&__ret, __p0, 1). Without __LITTLE_ENDIAN__
   * the lanes of val[0] and val[1] are reversed after the builtin call.
   * NOTE(review): 1 is presumably the builtin's type code -- confirm. */
  14361 #ifdef __LITTLE_ENDIAN__
  14362 #define vld2_dup_s16(__p0) __extension__ ({ \
  14363   int16x4x2_t __ret; \
  14364   __builtin_neon_vld2_dup_v(&__ret, __p0, 1); \
  14365   __ret; \
  14366 })
  14367 #else
  14368 #define vld2_dup_s16(__p0) __extension__ ({ \
  14369   int16x4x2_t __ret; \
  14370   __builtin_neon_vld2_dup_v(&__ret, __p0, 1); \
  14371  \
  14372   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14373   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14374   __ret; \
  14375 })
  14376 #endif
  14377 
  /* vld2_lane_p8(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the poly8x8x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-reversed into __rev1
   * before the call and the outputs are lane-reversed after it.
   * NOTE(review): 4 is presumably the builtin's type code -- confirm. */
  14378 #ifdef __LITTLE_ENDIAN__
  14379 #define vld2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  14380   poly8x8x2_t __ret; \
  14381   poly8x8x2_t __s1 = __p1; \
  14382   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 4); \
  14383   __ret; \
  14384 })
  14385 #else
  14386 #define vld2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  14387   poly8x8x2_t __ret; \
  14388   poly8x8x2_t __s1 = __p1; \
  14389   poly8x8x2_t __rev1; \
  14390   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14391   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14392   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 4); \
  14393  \
  14394   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14395   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14396   __ret; \
  14397 })
  14398 #endif
  14399 
  /* vld2_lane_p16(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the poly16x4x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-reversed into __rev1
   * before the call and the outputs are lane-reversed after it.
   * NOTE(review): 5 is presumably the builtin's type code -- confirm. */
  14400 #ifdef __LITTLE_ENDIAN__
  14401 #define vld2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  14402   poly16x4x2_t __ret; \
  14403   poly16x4x2_t __s1 = __p1; \
  14404   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 5); \
  14405   __ret; \
  14406 })
  14407 #else
  14408 #define vld2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  14409   poly16x4x2_t __ret; \
  14410   poly16x4x2_t __s1 = __p1; \
  14411   poly16x4x2_t __rev1; \
  14412   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14413   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14414   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 5); \
  14415  \
  14416   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14417   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14418   __ret; \
  14419 })
  14420 #endif
  14421 
  /* vld2q_lane_p16(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the poly16x8x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 37 is presumably the builtin's type code -- confirm. */
  14422 #ifdef __LITTLE_ENDIAN__
  14423 #define vld2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  14424   poly16x8x2_t __ret; \
  14425   poly16x8x2_t __s1 = __p1; \
  14426   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 37); \
  14427   __ret; \
  14428 })
  14429 #else
  14430 #define vld2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  14431   poly16x8x2_t __ret; \
  14432   poly16x8x2_t __s1 = __p1; \
  14433   poly16x8x2_t __rev1; \
  14434   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14435   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14436   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 37); \
  14437  \
  14438   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14439   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14440   __ret; \
  14441 })
  14442 #endif
  14443 
  /* vld2q_lane_u32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the uint32x4x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 50 is presumably the builtin's type code -- confirm. */
  14444 #ifdef __LITTLE_ENDIAN__
  14445 #define vld2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  14446   uint32x4x2_t __ret; \
  14447   uint32x4x2_t __s1 = __p1; \
  14448   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 50); \
  14449   __ret; \
  14450 })
  14451 #else
  14452 #define vld2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  14453   uint32x4x2_t __ret; \
  14454   uint32x4x2_t __s1 = __p1; \
  14455   uint32x4x2_t __rev1; \
  14456   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14457   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14458   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 50); \
  14459  \
  14460   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14461   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14462   __ret; \
  14463 })
  14464 #endif
  14465 
  /* vld2q_lane_u16(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the uint16x8x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 49 is presumably the builtin's type code -- confirm. */
  14466 #ifdef __LITTLE_ENDIAN__
  14467 #define vld2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  14468   uint16x8x2_t __ret; \
  14469   uint16x8x2_t __s1 = __p1; \
  14470   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 49); \
  14471   __ret; \
  14472 })
  14473 #else
  14474 #define vld2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  14475   uint16x8x2_t __ret; \
  14476   uint16x8x2_t __s1 = __p1; \
  14477   uint16x8x2_t __rev1; \
  14478   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14479   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14480   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 49); \
  14481  \
  14482   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14483   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14484   __ret; \
  14485 })
  14486 #endif
  14487 
  /* vld2q_lane_f32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the float32x4x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 41 is presumably the builtin's type code -- confirm. */
  14488 #ifdef __LITTLE_ENDIAN__
  14489 #define vld2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  14490   float32x4x2_t __ret; \
  14491   float32x4x2_t __s1 = __p1; \
  14492   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 41); \
  14493   __ret; \
  14494 })
  14495 #else
  14496 #define vld2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  14497   float32x4x2_t __ret; \
  14498   float32x4x2_t __s1 = __p1; \
  14499   float32x4x2_t __rev1; \
  14500   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14501   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14502   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 41); \
  14503  \
  14504   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14505   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14506   __ret; \
  14507 })
  14508 #endif
  14509 
  /* vld2q_lane_s32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the int32x4x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 34 is presumably the builtin's type code -- confirm. */
  14510 #ifdef __LITTLE_ENDIAN__
  14511 #define vld2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  14512   int32x4x2_t __ret; \
  14513   int32x4x2_t __s1 = __p1; \
  14514   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 34); \
  14515   __ret; \
  14516 })
  14517 #else
  14518 #define vld2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  14519   int32x4x2_t __ret; \
  14520   int32x4x2_t __s1 = __p1; \
  14521   int32x4x2_t __rev1; \
  14522   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14523   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14524   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 34); \
  14525  \
  14526   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14527   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14528   __ret; \
  14529 })
  14530 #endif
  14531 
  /* vld2q_lane_s16(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x16_t) plus __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v, and yields the int16x8x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-reversed into
   * __rev1 before the call and the outputs are lane-reversed after it.
   * NOTE(review): 33 is presumably the builtin's type code -- confirm. */
  14532 #ifdef __LITTLE_ENDIAN__
  14533 #define vld2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  14534   int16x8x2_t __ret; \
  14535   int16x8x2_t __s1 = __p1; \
  14536   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 33); \
  14537   __ret; \
  14538 })
  14539 #else
  14540 #define vld2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  14541   int16x8x2_t __ret; \
  14542   int16x8x2_t __s1 = __p1; \
  14543   int16x8x2_t __rev1; \
  14544   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14545   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14546   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 33); \
  14547  \
  14548   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14549   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14550   __ret; \
  14551 })
  14552 #endif
  14553 
  /* vld2_lane_u8(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the uint8x8x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-reversed into __rev1
   * before the call and the outputs are lane-reversed after it.
   * NOTE(review): 16 is presumably the builtin's type code -- confirm. */
  14554 #ifdef __LITTLE_ENDIAN__
  14555 #define vld2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  14556   uint8x8x2_t __ret; \
  14557   uint8x8x2_t __s1 = __p1; \
  14558   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 16); \
  14559   __ret; \
  14560 })
  14561 #else
  14562 #define vld2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  14563   uint8x8x2_t __ret; \
  14564   uint8x8x2_t __s1 = __p1; \
  14565   uint8x8x2_t __rev1; \
  14566   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14567   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14568   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 16); \
  14569  \
  14570   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14571   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14572   __ret; \
  14573 })
  14574 #endif
  14575 
  /* vld2_lane_u32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the uint32x2x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-swapped into __rev1
   * before the call and the outputs are lane-swapped after it.
   * NOTE(review): 18 is presumably the builtin's type code -- confirm. */
  14576 #ifdef __LITTLE_ENDIAN__
  14577 #define vld2_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  14578   uint32x2x2_t __ret; \
  14579   uint32x2x2_t __s1 = __p1; \
  14580   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 18); \
  14581   __ret; \
  14582 })
  14583 #else
  14584 #define vld2_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  14585   uint32x2x2_t __ret; \
  14586   uint32x2x2_t __s1 = __p1; \
  14587   uint32x2x2_t __rev1; \
  14588   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  14589   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  14590   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 18); \
  14591  \
  14592   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14593   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14594   __ret; \
  14595 })
  14596 #endif
  14597 
  /* vld2_lane_u16(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the uint16x4x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-reversed into __rev1
   * before the call and the outputs are lane-reversed after it.
   * NOTE(review): 17 is presumably the builtin's type code -- confirm. */
  14598 #ifdef __LITTLE_ENDIAN__
  14599 #define vld2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  14600   uint16x4x2_t __ret; \
  14601   uint16x4x2_t __s1 = __p1; \
  14602   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 17); \
  14603   __ret; \
  14604 })
  14605 #else
  14606 #define vld2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  14607   uint16x4x2_t __ret; \
  14608   uint16x4x2_t __s1 = __p1; \
  14609   uint16x4x2_t __rev1; \
  14610   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14611   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14612   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 17); \
  14613  \
  14614   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14615   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14616   __ret; \
  14617 })
  14618 #endif
  14619 
  /* vld2_lane_s8(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the int8x8x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-reversed into __rev1
   * before the call and the outputs are lane-reversed after it.
   * NOTE(review): 0 is presumably the builtin's type code -- confirm. */
  14620 #ifdef __LITTLE_ENDIAN__
  14621 #define vld2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  14622   int8x8x2_t __ret; \
  14623   int8x8x2_t __s1 = __p1; \
  14624   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 0); \
  14625   __ret; \
  14626 })
  14627 #else
  14628 #define vld2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  14629   int8x8x2_t __ret; \
  14630   int8x8x2_t __s1 = __p1; \
  14631   int8x8x2_t __rev1; \
  14632   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14633   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14634   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 0); \
  14635  \
  14636   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14637   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14638   __ret; \
  14639 })
  14640 #endif
  14641 
  /* vld2_lane_f32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the float32x2x2_t written to
   * __ret. Without __LITTLE_ENDIAN__ the inputs are lane-swapped into
   * __rev1 before the call and the outputs are lane-swapped after it.
   * NOTE(review): 9 is presumably the builtin's type code -- confirm. */
  14642 #ifdef __LITTLE_ENDIAN__
  14643 #define vld2_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  14644   float32x2x2_t __ret; \
  14645   float32x2x2_t __s1 = __p1; \
  14646   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 9); \
  14647   __ret; \
  14648 })
  14649 #else
  14650 #define vld2_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  14651   float32x2x2_t __ret; \
  14652   float32x2x2_t __s1 = __p1; \
  14653   float32x2x2_t __rev1; \
  14654   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  14655   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  14656   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 9); \
  14657  \
  14658   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14659   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14660   __ret; \
  14661 })
  14662 #endif
  14663 
  /* vld2_lane_s32(__p0, __p1, __p2): copies __p1 to __s1, hands its two
   * vectors (cast to int8x8_t) plus __p0 and __p2 to
   * __builtin_neon_vld2_lane_v, and yields the int32x2x2_t written to __ret.
   * Without __LITTLE_ENDIAN__ the inputs are lane-swapped into __rev1
   * before the call and the outputs are lane-swapped after it.
   * NOTE(review): 2 is presumably the builtin's type code -- confirm. */
  14664 #ifdef __LITTLE_ENDIAN__
  14665 #define vld2_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  14666   int32x2x2_t __ret; \
  14667   int32x2x2_t __s1 = __p1; \
  14668   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 2); \
  14669   __ret; \
  14670 })
  14671 #else
  14672 #define vld2_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  14673   int32x2x2_t __ret; \
  14674   int32x2x2_t __s1 = __p1; \
  14675   int32x2x2_t __rev1; \
  14676   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  14677   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  14678   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 2); \
  14679  \
  14680   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14681   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14682   __ret; \
  14683 })
  14684 #endif
  14685 
  14686 #ifdef __LITTLE_ENDIAN__
        /* vld2_lane_s16(__p0, __p1, __p2): statement expression yielding an
         * int16x4x2_t. __p1 is copied once into __s1; its two vectors are cast
         * to int8x8_t and passed with __p0 and __p2 to
         * __builtin_neon_vld2_lane_v. The trailing 1 is presumably the builtin's
         * element-type selector and __p2 the lane number (TODO confirm).
         * Little-endian variant: no lane reordering. */
  14687 #define vld2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  14688   int16x4x2_t __ret; \
  14689   int16x4x2_t __s1 = __p1; \
  14690   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 1); \
  14691   __ret; \
  14692 })
  14693 #else
        /* Big-endian variant: each 4-lane input vector is reversed into __rev1
         * before the call and each result vector is reversed after it;
         * __p2 is forwarded unchanged. */
  14694 #define vld2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  14695   int16x4x2_t __ret; \
  14696   int16x4x2_t __s1 = __p1; \
  14697   int16x4x2_t __rev1; \
  14698   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  14699   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  14700   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 1); \
  14701  \
  14702   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14703   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14704   __ret; \
  14705 })
  14706 #endif
  14707 
  14708 #ifdef __LITTLE_ENDIAN__
        /* vld3_p8(__p0): statement expression yielding a poly8x8x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 4). The trailing 4
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14709 #define vld3_p8(__p0) __extension__ ({ \
  14710   poly8x8x3_t __ret; \
  14711   __builtin_neon_vld3_v(&__ret, __p0, 4); \
  14712   __ret; \
  14713 })
  14714 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14715 #define vld3_p8(__p0) __extension__ ({ \
  14716   poly8x8x3_t __ret; \
  14717   __builtin_neon_vld3_v(&__ret, __p0, 4); \
  14718  \
  14719   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14720   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14721   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14722   __ret; \
  14723 })
  14724 #endif
  14725 
  14726 #ifdef __LITTLE_ENDIAN__
        /* vld3_p16(__p0): statement expression yielding a poly16x4x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 5). The trailing 5
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14727 #define vld3_p16(__p0) __extension__ ({ \
  14728   poly16x4x3_t __ret; \
  14729   __builtin_neon_vld3_v(&__ret, __p0, 5); \
  14730   __ret; \
  14731 })
  14732 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14733 #define vld3_p16(__p0) __extension__ ({ \
  14734   poly16x4x3_t __ret; \
  14735   __builtin_neon_vld3_v(&__ret, __p0, 5); \
  14736  \
  14737   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14738   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14739   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  14740   __ret; \
  14741 })
  14742 #endif
  14743 
  14744 #ifdef __LITTLE_ENDIAN__
        /* vld3q_p8(__p0): statement expression yielding a poly8x16x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 36). The trailing 36
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14745 #define vld3q_p8(__p0) __extension__ ({ \
  14746   poly8x16x3_t __ret; \
  14747   __builtin_neon_vld3q_v(&__ret, __p0, 36); \
  14748   __ret; \
  14749 })
  14750 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14751 #define vld3q_p8(__p0) __extension__ ({ \
  14752   poly8x16x3_t __ret; \
  14753   __builtin_neon_vld3q_v(&__ret, __p0, 36); \
  14754  \
  14755   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14756   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14757   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14758   __ret; \
  14759 })
  14760 #endif
  14761 
  14762 #ifdef __LITTLE_ENDIAN__
        /* vld3q_p16(__p0): statement expression yielding a poly16x8x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 37). The trailing 37
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14763 #define vld3q_p16(__p0) __extension__ ({ \
  14764   poly16x8x3_t __ret; \
  14765   __builtin_neon_vld3q_v(&__ret, __p0, 37); \
  14766   __ret; \
  14767 })
  14768 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14769 #define vld3q_p16(__p0) __extension__ ({ \
  14770   poly16x8x3_t __ret; \
  14771   __builtin_neon_vld3q_v(&__ret, __p0, 37); \
  14772  \
  14773   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14774   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14775   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14776   __ret; \
  14777 })
  14778 #endif
  14779 
  14780 #ifdef __LITTLE_ENDIAN__
        /* vld3q_u8(__p0): statement expression yielding a uint8x16x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 48). The trailing 48
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14781 #define vld3q_u8(__p0) __extension__ ({ \
  14782   uint8x16x3_t __ret; \
  14783   __builtin_neon_vld3q_v(&__ret, __p0, 48); \
  14784   __ret; \
  14785 })
  14786 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14787 #define vld3q_u8(__p0) __extension__ ({ \
  14788   uint8x16x3_t __ret; \
  14789   __builtin_neon_vld3q_v(&__ret, __p0, 48); \
  14790  \
  14791   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14792   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14793   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14794   __ret; \
  14795 })
  14796 #endif
  14797 
  14798 #ifdef __LITTLE_ENDIAN__
        /* vld3q_u32(__p0): statement expression yielding a uint32x4x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 50). The trailing 50
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14799 #define vld3q_u32(__p0) __extension__ ({ \
  14800   uint32x4x3_t __ret; \
  14801   __builtin_neon_vld3q_v(&__ret, __p0, 50); \
  14802   __ret; \
  14803 })
  14804 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14805 #define vld3q_u32(__p0) __extension__ ({ \
  14806   uint32x4x3_t __ret; \
  14807   __builtin_neon_vld3q_v(&__ret, __p0, 50); \
  14808  \
  14809   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14810   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14811   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  14812   __ret; \
  14813 })
  14814 #endif
  14815 
  14816 #ifdef __LITTLE_ENDIAN__
        /* vld3q_u16(__p0): statement expression yielding a uint16x8x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 49). The trailing 49
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14817 #define vld3q_u16(__p0) __extension__ ({ \
  14818   uint16x8x3_t __ret; \
  14819   __builtin_neon_vld3q_v(&__ret, __p0, 49); \
  14820   __ret; \
  14821 })
  14822 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14823 #define vld3q_u16(__p0) __extension__ ({ \
  14824   uint16x8x3_t __ret; \
  14825   __builtin_neon_vld3q_v(&__ret, __p0, 49); \
  14826  \
  14827   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14828   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14829   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14830   __ret; \
  14831 })
  14832 #endif
  14833 
  14834 #ifdef __LITTLE_ENDIAN__
        /* vld3q_s8(__p0): statement expression yielding an int8x16x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 32). The trailing 32
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14835 #define vld3q_s8(__p0) __extension__ ({ \
  14836   int8x16x3_t __ret; \
  14837   __builtin_neon_vld3q_v(&__ret, __p0, 32); \
  14838   __ret; \
  14839 })
  14840 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14841 #define vld3q_s8(__p0) __extension__ ({ \
  14842   int8x16x3_t __ret; \
  14843   __builtin_neon_vld3q_v(&__ret, __p0, 32); \
  14844  \
  14845   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14846   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14847   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  14848   __ret; \
  14849 })
  14850 #endif
  14851 
  14852 #ifdef __LITTLE_ENDIAN__
        /* vld3q_f32(__p0): statement expression yielding a float32x4x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 41). The trailing 41
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14853 #define vld3q_f32(__p0) __extension__ ({ \
  14854   float32x4x3_t __ret; \
  14855   __builtin_neon_vld3q_v(&__ret, __p0, 41); \
  14856   __ret; \
  14857 })
  14858 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14859 #define vld3q_f32(__p0) __extension__ ({ \
  14860   float32x4x3_t __ret; \
  14861   __builtin_neon_vld3q_v(&__ret, __p0, 41); \
  14862  \
  14863   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14864   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14865   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  14866   __ret; \
  14867 })
  14868 #endif
  14869 
  14870 #ifdef __LITTLE_ENDIAN__
        /* vld3q_s32(__p0): statement expression yielding an int32x4x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 34). The trailing 34
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14871 #define vld3q_s32(__p0) __extension__ ({ \
  14872   int32x4x3_t __ret; \
  14873   __builtin_neon_vld3q_v(&__ret, __p0, 34); \
  14874   __ret; \
  14875 })
  14876 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14877 #define vld3q_s32(__p0) __extension__ ({ \
  14878   int32x4x3_t __ret; \
  14879   __builtin_neon_vld3q_v(&__ret, __p0, 34); \
  14880  \
  14881   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14882   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14883   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  14884   __ret; \
  14885 })
  14886 #endif
  14887 
  14888 #ifdef __LITTLE_ENDIAN__
        /* vld3q_s16(__p0): statement expression yielding an int16x8x3_t that is
         * filled in by __builtin_neon_vld3q_v(&__ret, __p0, 33). The trailing 33
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14889 #define vld3q_s16(__p0) __extension__ ({ \
  14890   int16x8x3_t __ret; \
  14891   __builtin_neon_vld3q_v(&__ret, __p0, 33); \
  14892   __ret; \
  14893 })
  14894 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14895 #define vld3q_s16(__p0) __extension__ ({ \
  14896   int16x8x3_t __ret; \
  14897   __builtin_neon_vld3q_v(&__ret, __p0, 33); \
  14898  \
  14899   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14900   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14901   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14902   __ret; \
  14903 })
  14904 #endif
  14905 
  14906 #ifdef __LITTLE_ENDIAN__
        /* vld3_u8(__p0): statement expression yielding a uint8x8x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 16). The trailing 16
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14907 #define vld3_u8(__p0) __extension__ ({ \
  14908   uint8x8x3_t __ret; \
  14909   __builtin_neon_vld3_v(&__ret, __p0, 16); \
  14910   __ret; \
  14911 })
  14912 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14913 #define vld3_u8(__p0) __extension__ ({ \
  14914   uint8x8x3_t __ret; \
  14915   __builtin_neon_vld3_v(&__ret, __p0, 16); \
  14916  \
  14917   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14918   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14919   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14920   __ret; \
  14921 })
  14922 #endif
  14923 
  14924 #ifdef __LITTLE_ENDIAN__
        /* vld3_u32(__p0): statement expression yielding a uint32x2x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 18). The trailing 18
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14925 #define vld3_u32(__p0) __extension__ ({ \
  14926   uint32x2x3_t __ret; \
  14927   __builtin_neon_vld3_v(&__ret, __p0, 18); \
  14928   __ret; \
  14929 })
  14930 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  14931 #define vld3_u32(__p0) __extension__ ({ \
  14932   uint32x2x3_t __ret; \
  14933   __builtin_neon_vld3_v(&__ret, __p0, 18); \
  14934  \
  14935   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14936   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14937   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  14938   __ret; \
  14939 })
  14940 #endif
  14941 
  14942 #define vld3_u64(__p0) __extension__ ({ /* yields a uint64x1x3_t; single definition, no endian-specific variant */ \
  14943   uint64x1x3_t __ret; /* local result; its address is handed to the builtin */ \
  14944   __builtin_neon_vld3_v(&__ret, __p0, 19); /* 19: presumably the element-type selector (TODO confirm) */ \
  14945   __ret; /* value of the statement expression */ \
  14946 })
  14947 #ifdef __LITTLE_ENDIAN__
        /* vld3_u16(__p0): statement expression yielding a uint16x4x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 17). The trailing 17
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14948 #define vld3_u16(__p0) __extension__ ({ \
  14949   uint16x4x3_t __ret; \
  14950   __builtin_neon_vld3_v(&__ret, __p0, 17); \
  14951   __ret; \
  14952 })
  14953 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14954 #define vld3_u16(__p0) __extension__ ({ \
  14955   uint16x4x3_t __ret; \
  14956   __builtin_neon_vld3_v(&__ret, __p0, 17); \
  14957  \
  14958   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  14959   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  14960   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  14961   __ret; \
  14962 })
  14963 #endif
  14964 
  14965 #ifdef __LITTLE_ENDIAN__
        /* vld3_s8(__p0): statement expression yielding an int8x8x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 0). The trailing 0
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14966 #define vld3_s8(__p0) __extension__ ({ \
  14967   int8x8x3_t __ret; \
  14968   __builtin_neon_vld3_v(&__ret, __p0, 0); \
  14969   __ret; \
  14970 })
  14971 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  14972 #define vld3_s8(__p0) __extension__ ({ \
  14973   int8x8x3_t __ret; \
  14974   __builtin_neon_vld3_v(&__ret, __p0, 0); \
  14975  \
  14976   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  14977   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  14978   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  14979   __ret; \
  14980 })
  14981 #endif
  14982 
  14983 #ifdef __LITTLE_ENDIAN__
        /* vld3_f32(__p0): statement expression yielding a float32x2x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 9). The trailing 9
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  14984 #define vld3_f32(__p0) __extension__ ({ \
  14985   float32x2x3_t __ret; \
  14986   __builtin_neon_vld3_v(&__ret, __p0, 9); \
  14987   __ret; \
  14988 })
  14989 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  14990 #define vld3_f32(__p0) __extension__ ({ \
  14991   float32x2x3_t __ret; \
  14992   __builtin_neon_vld3_v(&__ret, __p0, 9); \
  14993  \
  14994   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  14995   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  14996   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  14997   __ret; \
  14998 })
  14999 #endif
  15000 
  15001 #ifdef __LITTLE_ENDIAN__
        /* vld3_s32(__p0): statement expression yielding an int32x2x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 2). The trailing 2
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  15002 #define vld3_s32(__p0) __extension__ ({ \
  15003   int32x2x3_t __ret; \
  15004   __builtin_neon_vld3_v(&__ret, __p0, 2); \
  15005   __ret; \
  15006 })
  15007 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15008 #define vld3_s32(__p0) __extension__ ({ \
  15009   int32x2x3_t __ret; \
  15010   __builtin_neon_vld3_v(&__ret, __p0, 2); \
  15011  \
  15012   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15013   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15014   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15015   __ret; \
  15016 })
  15017 #endif
  15018 
  15019 #define vld3_s64(__p0) __extension__ ({ /* yields an int64x1x3_t; single definition, no endian-specific variant */ \
  15020   int64x1x3_t __ret; /* local result; its address is handed to the builtin */ \
  15021   __builtin_neon_vld3_v(&__ret, __p0, 3); /* 3: presumably the element-type selector (TODO confirm) */ \
  15022   __ret; /* value of the statement expression */ \
  15023 })
  15024 #ifdef __LITTLE_ENDIAN__
        /* vld3_s16(__p0): statement expression yielding an int16x4x3_t that is
         * filled in by __builtin_neon_vld3_v(&__ret, __p0, 1). The trailing 1
         * is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  15025 #define vld3_s16(__p0) __extension__ ({ \
  15026   int16x4x3_t __ret; \
  15027   __builtin_neon_vld3_v(&__ret, __p0, 1); \
  15028   __ret; \
  15029 })
  15030 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15031 #define vld3_s16(__p0) __extension__ ({ \
  15032   int16x4x3_t __ret; \
  15033   __builtin_neon_vld3_v(&__ret, __p0, 1); \
  15034  \
  15035   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15036   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15037   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15038   __ret; \
  15039 })
  15040 #endif
  15041 
  15042 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_p8(__p0): statement expression yielding a poly8x8x3_t that is
         * filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 4). The trailing
         * 4 is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  15043 #define vld3_dup_p8(__p0) __extension__ ({ \
  15044   poly8x8x3_t __ret; \
  15045   __builtin_neon_vld3_dup_v(&__ret, __p0, 4); \
  15046   __ret; \
  15047 })
  15048 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15049 #define vld3_dup_p8(__p0) __extension__ ({ \
  15050   poly8x8x3_t __ret; \
  15051   __builtin_neon_vld3_dup_v(&__ret, __p0, 4); \
  15052  \
  15053   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15054   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15055   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15056   __ret; \
  15057 })
  15058 #endif
  15059 
  15060 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_p16(__p0): statement expression yielding a poly16x4x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 5). The
         * trailing 5 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15061 #define vld3_dup_p16(__p0) __extension__ ({ \
  15062   poly16x4x3_t __ret; \
  15063   __builtin_neon_vld3_dup_v(&__ret, __p0, 5); \
  15064   __ret; \
  15065 })
  15066 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15067 #define vld3_dup_p16(__p0) __extension__ ({ \
  15068   poly16x4x3_t __ret; \
  15069   __builtin_neon_vld3_dup_v(&__ret, __p0, 5); \
  15070  \
  15071   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15072   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15073   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15074   __ret; \
  15075 })
  15076 #endif
  15077 
  15078 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_p8(__p0): statement expression yielding a poly8x16x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 36). The
         * trailing 36 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15079 #define vld3q_dup_p8(__p0) __extension__ ({ \
  15080   poly8x16x3_t __ret; \
  15081   __builtin_neon_vld3q_dup_v(&__ret, __p0, 36); \
  15082   __ret; \
  15083 })
  15084 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15085 #define vld3q_dup_p8(__p0) __extension__ ({ \
  15086   poly8x16x3_t __ret; \
  15087   __builtin_neon_vld3q_dup_v(&__ret, __p0, 36); \
  15088  \
  15089   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15090   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15091   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15092   __ret; \
  15093 })
  15094 #endif
  15095 
  15096 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_p16(__p0): statement expression yielding a poly16x8x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 37). The
         * trailing 37 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15097 #define vld3q_dup_p16(__p0) __extension__ ({ \
  15098   poly16x8x3_t __ret; \
  15099   __builtin_neon_vld3q_dup_v(&__ret, __p0, 37); \
  15100   __ret; \
  15101 })
  15102 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15103 #define vld3q_dup_p16(__p0) __extension__ ({ \
  15104   poly16x8x3_t __ret; \
  15105   __builtin_neon_vld3q_dup_v(&__ret, __p0, 37); \
  15106  \
  15107   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15108   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15109   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15110   __ret; \
  15111 })
  15112 #endif
  15113 
  15114 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_u8(__p0): statement expression yielding a uint8x16x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 48). The
         * trailing 48 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15115 #define vld3q_dup_u8(__p0) __extension__ ({ \
  15116   uint8x16x3_t __ret; \
  15117   __builtin_neon_vld3q_dup_v(&__ret, __p0, 48); \
  15118   __ret; \
  15119 })
  15120 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15121 #define vld3q_dup_u8(__p0) __extension__ ({ \
  15122   uint8x16x3_t __ret; \
  15123   __builtin_neon_vld3q_dup_v(&__ret, __p0, 48); \
  15124  \
  15125   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15126   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15127   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15128   __ret; \
  15129 })
  15130 #endif
  15131 
  15132 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_u32(__p0): statement expression yielding a uint32x4x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 50). The
         * trailing 50 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15133 #define vld3q_dup_u32(__p0) __extension__ ({ \
  15134   uint32x4x3_t __ret; \
  15135   __builtin_neon_vld3q_dup_v(&__ret, __p0, 50); \
  15136   __ret; \
  15137 })
  15138 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15139 #define vld3q_dup_u32(__p0) __extension__ ({ \
  15140   uint32x4x3_t __ret; \
  15141   __builtin_neon_vld3q_dup_v(&__ret, __p0, 50); \
  15142  \
  15143   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15144   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15145   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15146   __ret; \
  15147 })
  15148 #endif
  15149 
  15150 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_u64(__p0): statement expression yielding a uint64x2x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 51). The
         * trailing 51 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15151 #define vld3q_dup_u64(__p0) __extension__ ({ \
  15152   uint64x2x3_t __ret; \
  15153   __builtin_neon_vld3q_dup_v(&__ret, __p0, 51); \
  15154   __ret; \
  15155 })
  15156 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15157 #define vld3q_dup_u64(__p0) __extension__ ({ \
  15158   uint64x2x3_t __ret; \
  15159   __builtin_neon_vld3q_dup_v(&__ret, __p0, 51); \
  15160  \
  15161   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15162   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15163   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15164   __ret; \
  15165 })
  15166 #endif
  15167 
  15168 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_u16(__p0): statement expression yielding a uint16x8x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 49). The
         * trailing 49 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15169 #define vld3q_dup_u16(__p0) __extension__ ({ \
  15170   uint16x8x3_t __ret; \
  15171   __builtin_neon_vld3q_dup_v(&__ret, __p0, 49); \
  15172   __ret; \
  15173 })
  15174 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15175 #define vld3q_dup_u16(__p0) __extension__ ({ \
  15176   uint16x8x3_t __ret; \
  15177   __builtin_neon_vld3q_dup_v(&__ret, __p0, 49); \
  15178  \
  15179   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15180   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15181   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15182   __ret; \
  15183 })
  15184 #endif
  15185 
  15186 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_s8(__p0): statement expression yielding an int8x16x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 32). The
         * trailing 32 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15187 #define vld3q_dup_s8(__p0) __extension__ ({ \
  15188   int8x16x3_t __ret; \
  15189   __builtin_neon_vld3q_dup_v(&__ret, __p0, 32); \
  15190   __ret; \
  15191 })
  15192 #else
        /* Big-endian variant: same call, then the 16 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15193 #define vld3q_dup_s8(__p0) __extension__ ({ \
  15194   int8x16x3_t __ret; \
  15195   __builtin_neon_vld3q_dup_v(&__ret, __p0, 32); \
  15196  \
  15197   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15198   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15199   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15200   __ret; \
  15201 })
  15202 #endif
  15203 
  15204 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_f32(__p0): statement expression yielding a float32x4x3_t
         * that is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 41). The
         * trailing 41 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15205 #define vld3q_dup_f32(__p0) __extension__ ({ \
  15206   float32x4x3_t __ret; \
  15207   __builtin_neon_vld3q_dup_v(&__ret, __p0, 41); \
  15208   __ret; \
  15209 })
  15210 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15211 #define vld3q_dup_f32(__p0) __extension__ ({ \
  15212   float32x4x3_t __ret; \
  15213   __builtin_neon_vld3q_dup_v(&__ret, __p0, 41); \
  15214  \
  15215   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15216   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15217   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15218   __ret; \
  15219 })
  15220 #endif
  15221 
  15222 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_s32(__p0): statement expression yielding an int32x4x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 34). The
         * trailing 34 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15223 #define vld3q_dup_s32(__p0) __extension__ ({ \
  15224   int32x4x3_t __ret; \
  15225   __builtin_neon_vld3q_dup_v(&__ret, __p0, 34); \
  15226   __ret; \
  15227 })
  15228 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15229 #define vld3q_dup_s32(__p0) __extension__ ({ \
  15230   int32x4x3_t __ret; \
  15231   __builtin_neon_vld3q_dup_v(&__ret, __p0, 34); \
  15232  \
  15233   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15234   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15235   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15236   __ret; \
  15237 })
  15238 #endif
  15239 
  15240 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_s64(__p0): statement expression yielding an int64x2x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 35). The
         * trailing 35 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15241 #define vld3q_dup_s64(__p0) __extension__ ({ \
  15242   int64x2x3_t __ret; \
  15243   __builtin_neon_vld3q_dup_v(&__ret, __p0, 35); \
  15244   __ret; \
  15245 })
  15246 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15247 #define vld3q_dup_s64(__p0) __extension__ ({ \
  15248   int64x2x3_t __ret; \
  15249   __builtin_neon_vld3q_dup_v(&__ret, __p0, 35); \
  15250  \
  15251   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15252   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15253   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15254   __ret; \
  15255 })
  15256 #endif
  15257 
  15258 #ifdef __LITTLE_ENDIAN__
        /* vld3q_dup_s16(__p0): statement expression yielding an int16x8x3_t that
         * is filled in by __builtin_neon_vld3q_dup_v(&__ret, __p0, 33). The
         * trailing 33 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15259 #define vld3q_dup_s16(__p0) __extension__ ({ \
  15260   int16x8x3_t __ret; \
  15261   __builtin_neon_vld3q_dup_v(&__ret, __p0, 33); \
  15262   __ret; \
  15263 })
  15264 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15265 #define vld3q_dup_s16(__p0) __extension__ ({ \
  15266   int16x8x3_t __ret; \
  15267   __builtin_neon_vld3q_dup_v(&__ret, __p0, 33); \
  15268  \
  15269   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15270   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15271   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15272   __ret; \
  15273 })
  15274 #endif
  15275 
  15276 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_u8(__p0): statement expression yielding a uint8x8x3_t that is
         * filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 16). The trailing
         * 16 is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  15277 #define vld3_dup_u8(__p0) __extension__ ({ \
  15278   uint8x8x3_t __ret; \
  15279   __builtin_neon_vld3_dup_v(&__ret, __p0, 16); \
  15280   __ret; \
  15281 })
  15282 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15283 #define vld3_dup_u8(__p0) __extension__ ({ \
  15284   uint8x8x3_t __ret; \
  15285   __builtin_neon_vld3_dup_v(&__ret, __p0, 16); \
  15286  \
  15287   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15288   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15289   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15290   __ret; \
  15291 })
  15292 #endif
  15293 
  15294 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_u32(__p0): statement expression yielding a uint32x2x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 18). The
         * trailing 18 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15295 #define vld3_dup_u32(__p0) __extension__ ({ \
  15296   uint32x2x3_t __ret; \
  15297   __builtin_neon_vld3_dup_v(&__ret, __p0, 18); \
  15298   __ret; \
  15299 })
  15300 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15301 #define vld3_dup_u32(__p0) __extension__ ({ \
  15302   uint32x2x3_t __ret; \
  15303   __builtin_neon_vld3_dup_v(&__ret, __p0, 18); \
  15304  \
  15305   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15306   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15307   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15308   __ret; \
  15309 })
  15310 #endif
  15311 
  15312 #define vld3_dup_u64(__p0) __extension__ ({ /* yields a uint64x1x3_t; single definition, no endian-specific variant */ \
  15313   uint64x1x3_t __ret; /* local result; its address is handed to the builtin */ \
  15314   __builtin_neon_vld3_dup_v(&__ret, __p0, 19); /* 19: presumably the element-type selector (TODO confirm) */ \
  15315   __ret; /* value of the statement expression */ \
  15316 })
  15317 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_u16(__p0): statement expression yielding a uint16x4x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 17). The
         * trailing 17 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15318 #define vld3_dup_u16(__p0) __extension__ ({ \
  15319   uint16x4x3_t __ret; \
  15320   __builtin_neon_vld3_dup_v(&__ret, __p0, 17); \
  15321   __ret; \
  15322 })
  15323 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15324 #define vld3_dup_u16(__p0) __extension__ ({ \
  15325   uint16x4x3_t __ret; \
  15326   __builtin_neon_vld3_dup_v(&__ret, __p0, 17); \
  15327  \
  15328   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15329   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15330   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15331   __ret; \
  15332 })
  15333 #endif
  15334 
  15335 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_s8(__p0): statement expression yielding an int8x8x3_t that is
         * filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 0). The trailing
         * 0 is presumably the builtin's element-type selector (TODO confirm).
         * Little-endian variant: the result is returned as the builtin left it. */
  15336 #define vld3_dup_s8(__p0) __extension__ ({ \
  15337   int8x8x3_t __ret; \
  15338   __builtin_neon_vld3_dup_v(&__ret, __p0, 0); \
  15339   __ret; \
  15340 })
  15341 #else
        /* Big-endian variant: same call, then the 8 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15342 #define vld3_dup_s8(__p0) __extension__ ({ \
  15343   int8x8x3_t __ret; \
  15344   __builtin_neon_vld3_dup_v(&__ret, __p0, 0); \
  15345  \
  15346   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15347   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15348   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15349   __ret; \
  15350 })
  15351 #endif
  15352 
  15353 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_f32(__p0): statement expression yielding a float32x2x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 9). The
         * trailing 9 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15354 #define vld3_dup_f32(__p0) __extension__ ({ \
  15355   float32x2x3_t __ret; \
  15356   __builtin_neon_vld3_dup_v(&__ret, __p0, 9); \
  15357   __ret; \
  15358 })
  15359 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15360 #define vld3_dup_f32(__p0) __extension__ ({ \
  15361   float32x2x3_t __ret; \
  15362   __builtin_neon_vld3_dup_v(&__ret, __p0, 9); \
  15363  \
  15364   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15365   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15366   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15367   __ret; \
  15368 })
  15369 #endif
  15370 
  15371 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_s32(__p0): statement expression yielding an int32x2x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 2). The
         * trailing 2 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15372 #define vld3_dup_s32(__p0) __extension__ ({ \
  15373   int32x2x3_t __ret; \
  15374   __builtin_neon_vld3_dup_v(&__ret, __p0, 2); \
  15375   __ret; \
  15376 })
  15377 #else
        /* Big-endian variant: same call, then the 2 lanes of each val[i] are
         * swapped with __builtin_shufflevector before returning. */
  15378 #define vld3_dup_s32(__p0) __extension__ ({ \
  15379   int32x2x3_t __ret; \
  15380   __builtin_neon_vld3_dup_v(&__ret, __p0, 2); \
  15381  \
  15382   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15383   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15384   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15385   __ret; \
  15386 })
  15387 #endif
  15388 
  15389 #define vld3_dup_s64(__p0) __extension__ ({ /* yields an int64x1x3_t; single definition, no endian-specific variant */ \
  15390   int64x1x3_t __ret; /* local result; its address is handed to the builtin */ \
  15391   __builtin_neon_vld3_dup_v(&__ret, __p0, 3); /* 3: presumably the element-type selector (TODO confirm) */ \
  15392   __ret; /* value of the statement expression */ \
  15393 })
  15394 #ifdef __LITTLE_ENDIAN__
        /* vld3_dup_s16(__p0): statement expression yielding an int16x4x3_t that
         * is filled in by __builtin_neon_vld3_dup_v(&__ret, __p0, 1). The
         * trailing 1 is presumably the builtin's element-type selector (TODO
         * confirm). Little-endian variant: the result is returned untouched. */
  15395 #define vld3_dup_s16(__p0) __extension__ ({ \
  15396   int16x4x3_t __ret; \
  15397   __builtin_neon_vld3_dup_v(&__ret, __p0, 1); \
  15398   __ret; \
  15399 })
  15400 #else
        /* Big-endian variant: same call, then the 4 lanes of each val[i] are
         * put in reverse order with __builtin_shufflevector before returning. */
  15401 #define vld3_dup_s16(__p0) __extension__ ({ \
  15402   int16x4x3_t __ret; \
  15403   __builtin_neon_vld3_dup_v(&__ret, __p0, 1); \
  15404  \
  15405   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15406   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15407   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15408   __ret; \
  15409 })
  15410 #endif
  15411 
  15412 #ifdef __LITTLE_ENDIAN__
        /* vld3_lane_p8(__p0, __p1, __p2): statement expression yielding a
         * poly8x8x3_t. __p1 is copied once into __s1; its three vectors are cast
         * to int8x8_t and passed with __p0 and __p2 to
         * __builtin_neon_vld3_lane_v. The trailing 4 is presumably the builtin's
         * element-type selector and __p2 the lane number (TODO confirm).
         * Little-endian variant: no lane reordering. */
  15413 #define vld3_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  15414   poly8x8x3_t __ret; \
  15415   poly8x8x3_t __s1 = __p1; \
  15416   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 4); \
  15417   __ret; \
  15418 })
  15419 #else
        /* Big-endian variant: each 8-lane input vector is reversed into __rev1
         * before the call and each result vector is reversed after it;
         * __p2 is forwarded unchanged. */
  15420 #define vld3_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  15421   poly8x8x3_t __ret; \
  15422   poly8x8x3_t __s1 = __p1; \
  15423   poly8x8x3_t __rev1; \
  15424   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15425   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15426   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15427   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 4); \
  15428  \
  15429   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15430   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15431   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15432   __ret; \
  15433 })
  15434 #endif
  15435 
  15436 #ifdef __LITTLE_ENDIAN__
        /* vld3_lane_p16(__p0, __p1, __p2): statement expression yielding a
         * poly16x4x3_t. __p1 is copied once into __s1; its three vectors are
         * cast to int8x8_t and passed with __p0 and __p2 to
         * __builtin_neon_vld3_lane_v. The trailing 5 is presumably the builtin's
         * element-type selector and __p2 the lane number (TODO confirm).
         * Little-endian variant: no lane reordering. */
  15437 #define vld3_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  15438   poly16x4x3_t __ret; \
  15439   poly16x4x3_t __s1 = __p1; \
  15440   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 5); \
  15441   __ret; \
  15442 })
  15443 #else
        /* Big-endian variant: each 4-lane input vector is reversed into __rev1
         * before the call and each result vector is reversed after it;
         * __p2 is forwarded unchanged. */
  15444 #define vld3_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  15445   poly16x4x3_t __ret; \
  15446   poly16x4x3_t __s1 = __p1; \
  15447   poly16x4x3_t __rev1; \
  15448   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15449   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15450   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15451   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 5); \
  15452  \
  15453   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15454   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15455   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15456   __ret; \
  15457 })
  15458 #endif
  15459 
  15460 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_p16(__p0, __p1, __p2): fills a poly16x8x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15461 #define vld3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  15462   poly16x8x3_t __ret; \
  15463   poly16x8x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15464   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 37); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15465   __ret; \
  15466 })
  15467 #else /* not little-endian: the 8 lanes of each vector are reversed before the builtin call and again on its results */
  15468 #define vld3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  15469   poly16x8x3_t __ret; \
  15470   poly16x8x3_t __s1 = __p1; \
  15471   poly16x8x3_t __rev1; \
  15472   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15473   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15474   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15475   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 37); \
  15476  \
  15477   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15478   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15479   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15480   __ret; \
  15481 })
  15482 #endif /* __LITTLE_ENDIAN__ */
  15483 
  15484 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_u32(__p0, __p1, __p2): fills a uint32x4x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15485 #define vld3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  15486   uint32x4x3_t __ret; \
  15487   uint32x4x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15488   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 50); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15489   __ret; \
  15490 })
  15491 #else /* not little-endian: the 4 lanes of each vector are reversed before the builtin call and again on its results */
  15492 #define vld3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  15493   uint32x4x3_t __ret; \
  15494   uint32x4x3_t __s1 = __p1; \
  15495   uint32x4x3_t __rev1; \
  15496   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15497   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15498   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15499   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 50); \
  15500  \
  15501   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15502   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15503   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15504   __ret; \
  15505 })
  15506 #endif /* __LITTLE_ENDIAN__ */
  15507 
  15508 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_u16(__p0, __p1, __p2): fills a uint16x8x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15509 #define vld3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  15510   uint16x8x3_t __ret; \
  15511   uint16x8x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15512   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 49); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15513   __ret; \
  15514 })
  15515 #else /* not little-endian: the 8 lanes of each vector are reversed before the builtin call and again on its results */
  15516 #define vld3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  15517   uint16x8x3_t __ret; \
  15518   uint16x8x3_t __s1 = __p1; \
  15519   uint16x8x3_t __rev1; \
  15520   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15521   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15522   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15523   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 49); \
  15524  \
  15525   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15526   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15527   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15528   __ret; \
  15529 })
  15530 #endif /* __LITTLE_ENDIAN__ */
  15531 
  15532 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_f32(__p0, __p1, __p2): fills a float32x4x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15533 #define vld3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  15534   float32x4x3_t __ret; \
  15535   float32x4x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15536   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 41); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15537   __ret; \
  15538 })
  15539 #else /* not little-endian: the 4 lanes of each vector are reversed before the builtin call and again on its results */
  15540 #define vld3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  15541   float32x4x3_t __ret; \
  15542   float32x4x3_t __s1 = __p1; \
  15543   float32x4x3_t __rev1; \
  15544   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15545   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15546   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15547   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 41); \
  15548  \
  15549   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15550   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15551   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15552   __ret; \
  15553 })
  15554 #endif /* __LITTLE_ENDIAN__ */
  15555 
  15556 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_s32(__p0, __p1, __p2): fills an int32x4x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15557 #define vld3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  15558   int32x4x3_t __ret; \
  15559   int32x4x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15560   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 34); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15561   __ret; \
  15562 })
  15563 #else /* not little-endian: the 4 lanes of each vector are reversed before the builtin call and again on its results */
  15564 #define vld3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  15565   int32x4x3_t __ret; \
  15566   int32x4x3_t __s1 = __p1; \
  15567   int32x4x3_t __rev1; \
  15568   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15569   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15570   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15571   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 34); \
  15572  \
  15573   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15574   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15575   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15576   __ret; \
  15577 })
  15578 #endif /* __LITTLE_ENDIAN__ */
  15579 
  15580 #ifdef __LITTLE_ENDIAN__ /* vld3q_lane_s16(__p0, __p1, __p2): fills an int16x8x3_t through __builtin_neon_vld3q_lane_v; this variant forwards __p1's vectors unchanged. */
  15581 #define vld3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  15582   int16x8x3_t __ret; \
  15583   int16x8x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15584   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 33); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15585   __ret; \
  15586 })
  15587 #else /* not little-endian: the 8 lanes of each vector are reversed before the builtin call and again on its results */
  15588 #define vld3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  15589   int16x8x3_t __ret; \
  15590   int16x8x3_t __s1 = __p1; \
  15591   int16x8x3_t __rev1; \
  15592   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15593   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15594   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15595   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 33); \
  15596  \
  15597   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15598   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15599   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15600   __ret; \
  15601 })
  15602 #endif /* __LITTLE_ENDIAN__ */
  15603 
  15604 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_u8(__p0, __p1, __p2): fills a uint8x8x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15605 #define vld3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  15606   uint8x8x3_t __ret; \
  15607   uint8x8x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15608   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 16); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15609   __ret; \
  15610 })
  15611 #else /* not little-endian: the 8 lanes of each vector are reversed before the builtin call and again on its results */
  15612 #define vld3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  15613   uint8x8x3_t __ret; \
  15614   uint8x8x3_t __s1 = __p1; \
  15615   uint8x8x3_t __rev1; \
  15616   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15617   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15618   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15619   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 16); \
  15620  \
  15621   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15622   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15623   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15624   __ret; \
  15625 })
  15626 #endif /* __LITTLE_ENDIAN__ */
  15627 
  15628 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_u32(__p0, __p1, __p2): fills a uint32x2x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15629 #define vld3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  15630   uint32x2x3_t __ret; \
  15631   uint32x2x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15632   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 18); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15633   __ret; \
  15634 })
  15635 #else /* not little-endian: the 2 lanes of each vector are swapped before the builtin call and again on its results */
  15636 #define vld3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  15637   uint32x2x3_t __ret; \
  15638   uint32x2x3_t __s1 = __p1; \
  15639   uint32x2x3_t __rev1; \
  15640   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  15641   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  15642   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  15643   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 18); \
  15644  \
  15645   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15646   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15647   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15648   __ret; \
  15649 })
  15650 #endif /* __LITTLE_ENDIAN__ */
  15651 
  15652 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_u16(__p0, __p1, __p2): fills a uint16x4x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15653 #define vld3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  15654   uint16x4x3_t __ret; \
  15655   uint16x4x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15656   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 17); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15657   __ret; \
  15658 })
  15659 #else /* not little-endian: the 4 lanes of each vector are reversed before the builtin call and again on its results */
  15660 #define vld3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  15661   uint16x4x3_t __ret; \
  15662   uint16x4x3_t __s1 = __p1; \
  15663   uint16x4x3_t __rev1; \
  15664   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15665   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15666   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15667   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 17); \
  15668  \
  15669   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15670   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15671   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15672   __ret; \
  15673 })
  15674 #endif /* __LITTLE_ENDIAN__ */
  15675 
  15676 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_s8(__p0, __p1, __p2): fills an int8x8x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15677 #define vld3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  15678   int8x8x3_t __ret; \
  15679   int8x8x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15680   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 0); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15681   __ret; \
  15682 })
  15683 #else /* not little-endian: the 8 lanes of each vector are reversed before the builtin call and again on its results */
  15684 #define vld3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  15685   int8x8x3_t __ret; \
  15686   int8x8x3_t __s1 = __p1; \
  15687   int8x8x3_t __rev1; \
  15688   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15689   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15690   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15691   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 0); \
  15692  \
  15693   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15694   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15695   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15696   __ret; \
  15697 })
  15698 #endif /* __LITTLE_ENDIAN__ */
  15699 
  15700 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_f32(__p0, __p1, __p2): fills a float32x2x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15701 #define vld3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  15702   float32x2x3_t __ret; \
  15703   float32x2x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15704   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 9); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15705   __ret; \
  15706 })
  15707 #else /* not little-endian: the 2 lanes of each vector are swapped before the builtin call and again on its results */
  15708 #define vld3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  15709   float32x2x3_t __ret; \
  15710   float32x2x3_t __s1 = __p1; \
  15711   float32x2x3_t __rev1; \
  15712   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  15713   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  15714   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  15715   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 9); \
  15716  \
  15717   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15718   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15719   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15720   __ret; \
  15721 })
  15722 #endif /* __LITTLE_ENDIAN__ */
  15723 
  15724 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_s32(__p0, __p1, __p2): fills an int32x2x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15725 #define vld3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  15726   int32x2x3_t __ret; \
  15727   int32x2x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15728   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 2); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15729   __ret; \
  15730 })
  15731 #else /* not little-endian: the 2 lanes of each vector are swapped before the builtin call and again on its results */
  15732 #define vld3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  15733   int32x2x3_t __ret; \
  15734   int32x2x3_t __s1 = __p1; \
  15735   int32x2x3_t __rev1; \
  15736   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  15737   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  15738   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  15739   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 2); \
  15740  \
  15741   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  15742   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  15743   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  15744   __ret; \
  15745 })
  15746 #endif /* __LITTLE_ENDIAN__ */
  15747 
  15748 #ifdef __LITTLE_ENDIAN__ /* vld3_lane_s16(__p0, __p1, __p2): fills an int16x4x3_t through __builtin_neon_vld3_lane_v; this variant forwards __p1's vectors unchanged. */
  15749 #define vld3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  15750   int16x4x3_t __ret; \
  15751   int16x4x3_t __s1 = __p1; /* single copy of the macro argument */ \
  15752   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 1); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15753   __ret; \
  15754 })
  15755 #else /* not little-endian: the 4 lanes of each vector are reversed before the builtin call and again on its results */
  15756 #define vld3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  15757   int16x4x3_t __ret; \
  15758   int16x4x3_t __s1 = __p1; \
  15759   int16x4x3_t __rev1; \
  15760   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  15761   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  15762   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  15763   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 1); \
  15764  \
  15765   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15766   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15767   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15768   __ret; \
  15769 })
  15770 #endif /* __LITTLE_ENDIAN__ */
  15771 
  15772 #ifdef __LITTLE_ENDIAN__ /* vld4_p8(__p0): fills a poly8x8x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  15773 #define vld4_p8(__p0) __extension__ ({ \
  15774   poly8x8x4_t __ret; \
  15775   __builtin_neon_vld4_v(&__ret, __p0, 4); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15776   __ret; \
  15777 })
  15778 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  15779 #define vld4_p8(__p0) __extension__ ({ \
  15780   poly8x8x4_t __ret; \
  15781   __builtin_neon_vld4_v(&__ret, __p0, 4); \
  15782  \
  15783   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15784   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15785   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15786   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  15787   __ret; \
  15788 })
  15789 #endif /* __LITTLE_ENDIAN__ */
  15790 
  15791 #ifdef __LITTLE_ENDIAN__ /* vld4_p16(__p0): fills a poly16x4x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  15792 #define vld4_p16(__p0) __extension__ ({ \
  15793   poly16x4x4_t __ret; \
  15794   __builtin_neon_vld4_v(&__ret, __p0, 5); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15795   __ret; \
  15796 })
  15797 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  15798 #define vld4_p16(__p0) __extension__ ({ \
  15799   poly16x4x4_t __ret; \
  15800   __builtin_neon_vld4_v(&__ret, __p0, 5); \
  15801  \
  15802   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15803   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15804   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15805   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  15806   __ret; \
  15807 })
  15808 #endif /* __LITTLE_ENDIAN__ */
  15809 
  15810 #ifdef __LITTLE_ENDIAN__ /* vld4q_p8(__p0): fills a poly8x16x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15811 #define vld4q_p8(__p0) __extension__ ({ \
  15812   poly8x16x4_t __ret; \
  15813   __builtin_neon_vld4q_v(&__ret, __p0, 36); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15814   __ret; \
  15815 })
  15816 #else /* not little-endian: each of the four result vectors has its 16 lanes reversed after the builtin call */
  15817 #define vld4q_p8(__p0) __extension__ ({ \
  15818   poly8x16x4_t __ret; \
  15819   __builtin_neon_vld4q_v(&__ret, __p0, 36); \
  15820  \
  15821   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15822   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15823   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15824   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15825   __ret; \
  15826 })
  15827 #endif /* __LITTLE_ENDIAN__ */
  15828 
  15829 #ifdef __LITTLE_ENDIAN__ /* vld4q_p16(__p0): fills a poly16x8x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15830 #define vld4q_p16(__p0) __extension__ ({ \
  15831   poly16x8x4_t __ret; \
  15832   __builtin_neon_vld4q_v(&__ret, __p0, 37); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15833   __ret; \
  15834 })
  15835 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  15836 #define vld4q_p16(__p0) __extension__ ({ \
  15837   poly16x8x4_t __ret; \
  15838   __builtin_neon_vld4q_v(&__ret, __p0, 37); \
  15839  \
  15840   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15841   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15842   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15843   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  15844   __ret; \
  15845 })
  15846 #endif /* __LITTLE_ENDIAN__ */
  15847 
  15848 #ifdef __LITTLE_ENDIAN__ /* vld4q_u8(__p0): fills a uint8x16x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15849 #define vld4q_u8(__p0) __extension__ ({ \
  15850   uint8x16x4_t __ret; \
  15851   __builtin_neon_vld4q_v(&__ret, __p0, 48); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15852   __ret; \
  15853 })
  15854 #else /* not little-endian: each of the four result vectors has its 16 lanes reversed after the builtin call */
  15855 #define vld4q_u8(__p0) __extension__ ({ \
  15856   uint8x16x4_t __ret; \
  15857   __builtin_neon_vld4q_v(&__ret, __p0, 48); \
  15858  \
  15859   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15860   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15861   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15862   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15863   __ret; \
  15864 })
  15865 #endif /* __LITTLE_ENDIAN__ */
  15866 
  15867 #ifdef __LITTLE_ENDIAN__ /* vld4q_u32(__p0): fills a uint32x4x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15868 #define vld4q_u32(__p0) __extension__ ({ \
  15869   uint32x4x4_t __ret; \
  15870   __builtin_neon_vld4q_v(&__ret, __p0, 50); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15871   __ret; \
  15872 })
  15873 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  15874 #define vld4q_u32(__p0) __extension__ ({ \
  15875   uint32x4x4_t __ret; \
  15876   __builtin_neon_vld4q_v(&__ret, __p0, 50); \
  15877  \
  15878   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15879   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15880   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15881   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  15882   __ret; \
  15883 })
  15884 #endif /* __LITTLE_ENDIAN__ */
  15885 
  15886 #ifdef __LITTLE_ENDIAN__ /* vld4q_u16(__p0): fills a uint16x8x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15887 #define vld4q_u16(__p0) __extension__ ({ \
  15888   uint16x8x4_t __ret; \
  15889   __builtin_neon_vld4q_v(&__ret, __p0, 49); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15890   __ret; \
  15891 })
  15892 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  15893 #define vld4q_u16(__p0) __extension__ ({ \
  15894   uint16x8x4_t __ret; \
  15895   __builtin_neon_vld4q_v(&__ret, __p0, 49); \
  15896  \
  15897   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15898   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15899   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15900   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  15901   __ret; \
  15902 })
  15903 #endif /* __LITTLE_ENDIAN__ */
  15904 
  15905 #ifdef __LITTLE_ENDIAN__ /* vld4q_s8(__p0): fills an int8x16x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15906 #define vld4q_s8(__p0) __extension__ ({ \
  15907   int8x16x4_t __ret; \
  15908   __builtin_neon_vld4q_v(&__ret, __p0, 32); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15909   __ret; \
  15910 })
  15911 #else /* not little-endian: each of the four result vectors has its 16 lanes reversed after the builtin call */
  15912 #define vld4q_s8(__p0) __extension__ ({ \
  15913   int8x16x4_t __ret; \
  15914   __builtin_neon_vld4q_v(&__ret, __p0, 32); \
  15915  \
  15916   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15917   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15918   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15919   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  15920   __ret; \
  15921 })
  15922 #endif /* __LITTLE_ENDIAN__ */
  15923 
  15924 #ifdef __LITTLE_ENDIAN__ /* vld4q_f32(__p0): fills a float32x4x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15925 #define vld4q_f32(__p0) __extension__ ({ \
  15926   float32x4x4_t __ret; \
  15927   __builtin_neon_vld4q_v(&__ret, __p0, 41); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15928   __ret; \
  15929 })
  15930 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  15931 #define vld4q_f32(__p0) __extension__ ({ \
  15932   float32x4x4_t __ret; \
  15933   __builtin_neon_vld4q_v(&__ret, __p0, 41); \
  15934  \
  15935   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15936   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15937   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15938   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  15939   __ret; \
  15940 })
  15941 #endif /* __LITTLE_ENDIAN__ */
  15942 
  15943 #ifdef __LITTLE_ENDIAN__ /* vld4q_s32(__p0): fills an int32x4x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15944 #define vld4q_s32(__p0) __extension__ ({ \
  15945   int32x4x4_t __ret; \
  15946   __builtin_neon_vld4q_v(&__ret, __p0, 34); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15947   __ret; \
  15948 })
  15949 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  15950 #define vld4q_s32(__p0) __extension__ ({ \
  15951   int32x4x4_t __ret; \
  15952   __builtin_neon_vld4q_v(&__ret, __p0, 34); \
  15953  \
  15954   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  15955   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  15956   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  15957   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  15958   __ret; \
  15959 })
  15960 #endif /* __LITTLE_ENDIAN__ */
  15961 
  15962 #ifdef __LITTLE_ENDIAN__ /* vld4q_s16(__p0): fills an int16x8x4_t through __builtin_neon_vld4q_v and yields it; this variant returns the builtin's output untouched. */
  15963 #define vld4q_s16(__p0) __extension__ ({ \
  15964   int16x8x4_t __ret; \
  15965   __builtin_neon_vld4q_v(&__ret, __p0, 33); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15966   __ret; \
  15967 })
  15968 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  15969 #define vld4q_s16(__p0) __extension__ ({ \
  15970   int16x8x4_t __ret; \
  15971   __builtin_neon_vld4q_v(&__ret, __p0, 33); \
  15972  \
  15973   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15974   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15975   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15976   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  15977   __ret; \
  15978 })
  15979 #endif /* __LITTLE_ENDIAN__ */
  15980 
  15981 #ifdef __LITTLE_ENDIAN__ /* vld4_u8(__p0): fills a uint8x8x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  15982 #define vld4_u8(__p0) __extension__ ({ \
  15983   uint8x8x4_t __ret; \
  15984   __builtin_neon_vld4_v(&__ret, __p0, 16); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  15985   __ret; \
  15986 })
  15987 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  15988 #define vld4_u8(__p0) __extension__ ({ \
  15989   uint8x8x4_t __ret; \
  15990   __builtin_neon_vld4_v(&__ret, __p0, 16); \
  15991  \
  15992   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  15993   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  15994   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  15995   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  15996   __ret; \
  15997 })
  15998 #endif /* __LITTLE_ENDIAN__ */
  15999 
  16000 #ifdef __LITTLE_ENDIAN__ /* vld4_u32(__p0): fills a uint32x2x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16001 #define vld4_u32(__p0) __extension__ ({ \
  16002   uint32x2x4_t __ret; \
  16003   __builtin_neon_vld4_v(&__ret, __p0, 18); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16004   __ret; \
  16005 })
  16006 #else /* not little-endian: each of the four result vectors has its 2 lanes swapped after the builtin call */
  16007 #define vld4_u32(__p0) __extension__ ({ \
  16008   uint32x2x4_t __ret; \
  16009   __builtin_neon_vld4_v(&__ret, __p0, 18); \
  16010  \
  16011   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16012   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16013   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16014   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16015   __ret; \
  16016 })
  16017 #endif /* __LITTLE_ENDIAN__ */
  16018 
  16019 #define vld4_u64(__p0) __extension__ ({ /* fills a uint64x1x4_t through __builtin_neon_vld4_v; single definition with no endianness split and no lane shuffle */ \
  16020   uint64x1x4_t __ret; \
  16021   __builtin_neon_vld4_v(&__ret, __p0, 19); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16022   __ret; /* value of the statement expression */ \
  16023 })
  16024 #ifdef __LITTLE_ENDIAN__ /* vld4_u16(__p0): fills a uint16x4x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16025 #define vld4_u16(__p0) __extension__ ({ \
  16026   uint16x4x4_t __ret; \
  16027   __builtin_neon_vld4_v(&__ret, __p0, 17); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16028   __ret; \
  16029 })
  16030 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  16031 #define vld4_u16(__p0) __extension__ ({ \
  16032   uint16x4x4_t __ret; \
  16033   __builtin_neon_vld4_v(&__ret, __p0, 17); \
  16034  \
  16035   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16036   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16037   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16038   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16039   __ret; \
  16040 })
  16041 #endif /* __LITTLE_ENDIAN__ */
  16042 
  16043 #ifdef __LITTLE_ENDIAN__ /* vld4_s8(__p0): fills an int8x8x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16044 #define vld4_s8(__p0) __extension__ ({ \
  16045   int8x8x4_t __ret; \
  16046   __builtin_neon_vld4_v(&__ret, __p0, 0); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16047   __ret; \
  16048 })
  16049 #else /* not little-endian: each of the four result vectors has its 8 lanes reversed after the builtin call */
  16050 #define vld4_s8(__p0) __extension__ ({ \
  16051   int8x8x4_t __ret; \
  16052   __builtin_neon_vld4_v(&__ret, __p0, 0); \
  16053  \
  16054   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16055   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16056   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16057   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16058   __ret; \
  16059 })
  16060 #endif /* __LITTLE_ENDIAN__ */
  16061 
  16062 #ifdef __LITTLE_ENDIAN__ /* vld4_f32(__p0): fills a float32x2x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16063 #define vld4_f32(__p0) __extension__ ({ \
  16064   float32x2x4_t __ret; \
  16065   __builtin_neon_vld4_v(&__ret, __p0, 9); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16066   __ret; \
  16067 })
  16068 #else /* not little-endian: each of the four result vectors has its 2 lanes swapped after the builtin call */
  16069 #define vld4_f32(__p0) __extension__ ({ \
  16070   float32x2x4_t __ret; \
  16071   __builtin_neon_vld4_v(&__ret, __p0, 9); \
  16072  \
  16073   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16074   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16075   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16076   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16077   __ret; \
  16078 })
  16079 #endif /* __LITTLE_ENDIAN__ */
  16080 
  16081 #ifdef __LITTLE_ENDIAN__ /* vld4_s32(__p0): fills an int32x2x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16082 #define vld4_s32(__p0) __extension__ ({ \
  16083   int32x2x4_t __ret; \
  16084   __builtin_neon_vld4_v(&__ret, __p0, 2); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16085   __ret; \
  16086 })
  16087 #else /* not little-endian: each of the four result vectors has its 2 lanes swapped after the builtin call */
  16088 #define vld4_s32(__p0) __extension__ ({ \
  16089   int32x2x4_t __ret; \
  16090   __builtin_neon_vld4_v(&__ret, __p0, 2); \
  16091  \
  16092   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16093   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16094   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16095   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16096   __ret; \
  16097 })
  16098 #endif /* __LITTLE_ENDIAN__ */
  16099 
  16100 #define vld4_s64(__p0) __extension__ ({ /* fills an int64x1x4_t through __builtin_neon_vld4_v; single definition with no endianness split and no lane shuffle */ \
  16101   int64x1x4_t __ret; \
  16102   __builtin_neon_vld4_v(&__ret, __p0, 3); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16103   __ret; /* value of the statement expression */ \
  16104 })
  16105 #ifdef __LITTLE_ENDIAN__ /* vld4_s16(__p0): fills an int16x4x4_t through __builtin_neon_vld4_v and yields it; this variant returns the builtin's output untouched. */
  16106 #define vld4_s16(__p0) __extension__ ({ \
  16107   int16x4x4_t __ret; \
  16108   __builtin_neon_vld4_v(&__ret, __p0, 1); /* NOTE(review): last argument presumably selects the element type - confirm */ \
  16109   __ret; \
  16110 })
  16111 #else /* not little-endian: each of the four result vectors has its 4 lanes reversed after the builtin call */
  16112 #define vld4_s16(__p0) __extension__ ({ \
  16113   int16x4x4_t __ret; \
  16114   __builtin_neon_vld4_v(&__ret, __p0, 1); \
  16115  \
  16116   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16117   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16118   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16119   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16120   __ret; \
  16121 })
  16122 #endif /* __LITTLE_ENDIAN__ */
  16123 
  /* vld4_dup_p8(__p0): statement-expression macro that evaluates to a poly8x8x4_t.
   * __builtin_neon_vld4_dup_v(&__ret, __p0, 4) fills the local __ret, which is
   * then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 4 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16124 #ifdef __LITTLE_ENDIAN__
  16125 #define vld4_dup_p8(__p0) __extension__ ({ \
  16126   poly8x8x4_t __ret; \
  16127   __builtin_neon_vld4_dup_v(&__ret, __p0, 4); \
  16128   __ret; \
  16129 })
  16130 #else
  16131 #define vld4_dup_p8(__p0) __extension__ ({ \
  16132   poly8x8x4_t __ret; \
  16133   __builtin_neon_vld4_dup_v(&__ret, __p0, 4); \
  16134  \
  16135   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16136   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16137   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16138   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16139   __ret; \
  16140 })
  16141 #endif
  16142 
  /* vld4_dup_p16(__p0): statement-expression macro that evaluates to a
   * poly16x4x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 5) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 5 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16143 #ifdef __LITTLE_ENDIAN__
  16144 #define vld4_dup_p16(__p0) __extension__ ({ \
  16145   poly16x4x4_t __ret; \
  16146   __builtin_neon_vld4_dup_v(&__ret, __p0, 5); \
  16147   __ret; \
  16148 })
  16149 #else
  16150 #define vld4_dup_p16(__p0) __extension__ ({ \
  16151   poly16x4x4_t __ret; \
  16152   __builtin_neon_vld4_dup_v(&__ret, __p0, 5); \
  16153  \
  16154   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16155   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16156   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16157   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16158   __ret; \
  16159 })
  16160 #endif
  16161 
  /* vld4q_dup_p8(__p0): statement-expression macro that evaluates to a
   * poly8x16x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 36) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 16 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 36 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16162 #ifdef __LITTLE_ENDIAN__
  16163 #define vld4q_dup_p8(__p0) __extension__ ({ \
  16164   poly8x16x4_t __ret; \
  16165   __builtin_neon_vld4q_dup_v(&__ret, __p0, 36); \
  16166   __ret; \
  16167 })
  16168 #else
  16169 #define vld4q_dup_p8(__p0) __extension__ ({ \
  16170   poly8x16x4_t __ret; \
  16171   __builtin_neon_vld4q_dup_v(&__ret, __p0, 36); \
  16172  \
  16173   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16174   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16175   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16176   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16177   __ret; \
  16178 })
  16179 #endif
  16180 
  /* vld4q_dup_p16(__p0): statement-expression macro that evaluates to a
   * poly16x8x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 37) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 37 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16181 #ifdef __LITTLE_ENDIAN__
  16182 #define vld4q_dup_p16(__p0) __extension__ ({ \
  16183   poly16x8x4_t __ret; \
  16184   __builtin_neon_vld4q_dup_v(&__ret, __p0, 37); \
  16185   __ret; \
  16186 })
  16187 #else
  16188 #define vld4q_dup_p16(__p0) __extension__ ({ \
  16189   poly16x8x4_t __ret; \
  16190   __builtin_neon_vld4q_dup_v(&__ret, __p0, 37); \
  16191  \
  16192   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16193   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16194   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16195   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16196   __ret; \
  16197 })
  16198 #endif
  16199 
  /* vld4q_dup_u8(__p0): statement-expression macro that evaluates to a
   * uint8x16x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 48) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 16 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 48 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16200 #ifdef __LITTLE_ENDIAN__
  16201 #define vld4q_dup_u8(__p0) __extension__ ({ \
  16202   uint8x16x4_t __ret; \
  16203   __builtin_neon_vld4q_dup_v(&__ret, __p0, 48); \
  16204   __ret; \
  16205 })
  16206 #else
  16207 #define vld4q_dup_u8(__p0) __extension__ ({ \
  16208   uint8x16x4_t __ret; \
  16209   __builtin_neon_vld4q_dup_v(&__ret, __p0, 48); \
  16210  \
  16211   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16212   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16213   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16214   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16215   __ret; \
  16216 })
  16217 #endif
  16218 
  /* vld4q_dup_u32(__p0): statement-expression macro that evaluates to a
   * uint32x4x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 50) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 50 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16219 #ifdef __LITTLE_ENDIAN__
  16220 #define vld4q_dup_u32(__p0) __extension__ ({ \
  16221   uint32x4x4_t __ret; \
  16222   __builtin_neon_vld4q_dup_v(&__ret, __p0, 50); \
  16223   __ret; \
  16224 })
  16225 #else
  16226 #define vld4q_dup_u32(__p0) __extension__ ({ \
  16227   uint32x4x4_t __ret; \
  16228   __builtin_neon_vld4q_dup_v(&__ret, __p0, 50); \
  16229  \
  16230   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16231   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16232   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16233   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16234   __ret; \
  16235 })
  16236 #endif
  16237 
  /* vld4q_dup_u64(__p0): statement-expression macro that evaluates to a
   * uint64x2x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 51) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 2 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 51 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16238 #ifdef __LITTLE_ENDIAN__
  16239 #define vld4q_dup_u64(__p0) __extension__ ({ \
  16240   uint64x2x4_t __ret; \
  16241   __builtin_neon_vld4q_dup_v(&__ret, __p0, 51); \
  16242   __ret; \
  16243 })
  16244 #else
  16245 #define vld4q_dup_u64(__p0) __extension__ ({ \
  16246   uint64x2x4_t __ret; \
  16247   __builtin_neon_vld4q_dup_v(&__ret, __p0, 51); \
  16248  \
  16249   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16250   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16251   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16252   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16253   __ret; \
  16254 })
  16255 #endif
  16256 
  /* vld4q_dup_u16(__p0): statement-expression macro that evaluates to a
   * uint16x8x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 49) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 49 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16257 #ifdef __LITTLE_ENDIAN__
  16258 #define vld4q_dup_u16(__p0) __extension__ ({ \
  16259   uint16x8x4_t __ret; \
  16260   __builtin_neon_vld4q_dup_v(&__ret, __p0, 49); \
  16261   __ret; \
  16262 })
  16263 #else
  16264 #define vld4q_dup_u16(__p0) __extension__ ({ \
  16265   uint16x8x4_t __ret; \
  16266   __builtin_neon_vld4q_dup_v(&__ret, __p0, 49); \
  16267  \
  16268   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16269   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16270   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16271   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16272   __ret; \
  16273 })
  16274 #endif
  16275 
  /* vld4q_dup_s8(__p0): statement-expression macro that evaluates to an
   * int8x16x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 32) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 16 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 32 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16276 #ifdef __LITTLE_ENDIAN__
  16277 #define vld4q_dup_s8(__p0) __extension__ ({ \
  16278   int8x16x4_t __ret; \
  16279   __builtin_neon_vld4q_dup_v(&__ret, __p0, 32); \
  16280   __ret; \
  16281 })
  16282 #else
  16283 #define vld4q_dup_s8(__p0) __extension__ ({ \
  16284   int8x16x4_t __ret; \
  16285   __builtin_neon_vld4q_dup_v(&__ret, __p0, 32); \
  16286  \
  16287   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16288   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16289   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16290   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  16291   __ret; \
  16292 })
  16293 #endif
  16294 
  /* vld4q_dup_f32(__p0): statement-expression macro that evaluates to a
   * float32x4x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 41) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 41 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16295 #ifdef __LITTLE_ENDIAN__
  16296 #define vld4q_dup_f32(__p0) __extension__ ({ \
  16297   float32x4x4_t __ret; \
  16298   __builtin_neon_vld4q_dup_v(&__ret, __p0, 41); \
  16299   __ret; \
  16300 })
  16301 #else
  16302 #define vld4q_dup_f32(__p0) __extension__ ({ \
  16303   float32x4x4_t __ret; \
  16304   __builtin_neon_vld4q_dup_v(&__ret, __p0, 41); \
  16305  \
  16306   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16307   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16308   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16309   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16310   __ret; \
  16311 })
  16312 #endif
  16313 
  /* vld4q_dup_s32(__p0): statement-expression macro that evaluates to an
   * int32x4x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 34) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 34 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16314 #ifdef __LITTLE_ENDIAN__
  16315 #define vld4q_dup_s32(__p0) __extension__ ({ \
  16316   int32x4x4_t __ret; \
  16317   __builtin_neon_vld4q_dup_v(&__ret, __p0, 34); \
  16318   __ret; \
  16319 })
  16320 #else
  16321 #define vld4q_dup_s32(__p0) __extension__ ({ \
  16322   int32x4x4_t __ret; \
  16323   __builtin_neon_vld4q_dup_v(&__ret, __p0, 34); \
  16324  \
  16325   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16326   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16327   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16328   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16329   __ret; \
  16330 })
  16331 #endif
  16332 
  /* vld4q_dup_s64(__p0): statement-expression macro that evaluates to an
   * int64x2x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 35) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 2 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 35 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16333 #ifdef __LITTLE_ENDIAN__
  16334 #define vld4q_dup_s64(__p0) __extension__ ({ \
  16335   int64x2x4_t __ret; \
  16336   __builtin_neon_vld4q_dup_v(&__ret, __p0, 35); \
  16337   __ret; \
  16338 })
  16339 #else
  16340 #define vld4q_dup_s64(__p0) __extension__ ({ \
  16341   int64x2x4_t __ret; \
  16342   __builtin_neon_vld4q_dup_v(&__ret, __p0, 35); \
  16343  \
  16344   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16345   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16346   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16347   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16348   __ret; \
  16349 })
  16350 #endif
  16351 
  /* vld4q_dup_s16(__p0): statement-expression macro that evaluates to an
   * int16x8x4_t. __builtin_neon_vld4q_dup_v(&__ret, __p0, 33) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 33 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16352 #ifdef __LITTLE_ENDIAN__
  16353 #define vld4q_dup_s16(__p0) __extension__ ({ \
  16354   int16x8x4_t __ret; \
  16355   __builtin_neon_vld4q_dup_v(&__ret, __p0, 33); \
  16356   __ret; \
  16357 })
  16358 #else
  16359 #define vld4q_dup_s16(__p0) __extension__ ({ \
  16360   int16x8x4_t __ret; \
  16361   __builtin_neon_vld4q_dup_v(&__ret, __p0, 33); \
  16362  \
  16363   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16364   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16365   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16366   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16367   __ret; \
  16368 })
  16369 #endif
  16370 
  /* vld4_dup_u8(__p0): statement-expression macro that evaluates to a uint8x8x4_t.
   * __builtin_neon_vld4_dup_v(&__ret, __p0, 16) fills the local __ret, which is
   * then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 16 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16371 #ifdef __LITTLE_ENDIAN__
  16372 #define vld4_dup_u8(__p0) __extension__ ({ \
  16373   uint8x8x4_t __ret; \
  16374   __builtin_neon_vld4_dup_v(&__ret, __p0, 16); \
  16375   __ret; \
  16376 })
  16377 #else
  16378 #define vld4_dup_u8(__p0) __extension__ ({ \
  16379   uint8x8x4_t __ret; \
  16380   __builtin_neon_vld4_dup_v(&__ret, __p0, 16); \
  16381  \
  16382   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16383   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16384   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16385   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16386   __ret; \
  16387 })
  16388 #endif
  16389 
  /* vld4_dup_u32(__p0): statement-expression macro that evaluates to a
   * uint32x2x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 18) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 2 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 18 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16390 #ifdef __LITTLE_ENDIAN__
  16391 #define vld4_dup_u32(__p0) __extension__ ({ \
  16392   uint32x2x4_t __ret; \
  16393   __builtin_neon_vld4_dup_v(&__ret, __p0, 18); \
  16394   __ret; \
  16395 })
  16396 #else
  16397 #define vld4_dup_u32(__p0) __extension__ ({ \
  16398   uint32x2x4_t __ret; \
  16399   __builtin_neon_vld4_dup_v(&__ret, __p0, 18); \
  16400  \
  16401   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16402   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16403   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16404   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16405   __ret; \
  16406 })
  16407 #endif
  16408 
  /* vld4_dup_u64(__p0): statement-expression macro that evaluates to a
   * uint64x1x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 19) fills the local
   * __ret, which is then yielded as the value of the expression.
   * Only one definition exists: there is no __LITTLE_ENDIAN__ split and no
   * lane shuffle here (NOTE(review): presumably because each val[] vector has
   * a single lane -- confirm). */
  16409 #define vld4_dup_u64(__p0) __extension__ ({ \
  16410   uint64x1x4_t __ret; \
  16411   __builtin_neon_vld4_dup_v(&__ret, __p0, 19); \
  16412   __ret; \
  16413 })
  /* vld4_dup_u16(__p0): statement-expression macro that evaluates to a
   * uint16x4x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 17) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 17 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16414 #ifdef __LITTLE_ENDIAN__
  16415 #define vld4_dup_u16(__p0) __extension__ ({ \
  16416   uint16x4x4_t __ret; \
  16417   __builtin_neon_vld4_dup_v(&__ret, __p0, 17); \
  16418   __ret; \
  16419 })
  16420 #else
  16421 #define vld4_dup_u16(__p0) __extension__ ({ \
  16422   uint16x4x4_t __ret; \
  16423   __builtin_neon_vld4_dup_v(&__ret, __p0, 17); \
  16424  \
  16425   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16426   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16427   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16428   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16429   __ret; \
  16430 })
  16431 #endif
  16432 
  /* vld4_dup_s8(__p0): statement-expression macro that evaluates to an int8x8x4_t.
   * __builtin_neon_vld4_dup_v(&__ret, __p0, 0) fills the local __ret, which is
   * then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 8 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 0 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16433 #ifdef __LITTLE_ENDIAN__
  16434 #define vld4_dup_s8(__p0) __extension__ ({ \
  16435   int8x8x4_t __ret; \
  16436   __builtin_neon_vld4_dup_v(&__ret, __p0, 0); \
  16437   __ret; \
  16438 })
  16439 #else
  16440 #define vld4_dup_s8(__p0) __extension__ ({ \
  16441   int8x8x4_t __ret; \
  16442   __builtin_neon_vld4_dup_v(&__ret, __p0, 0); \
  16443  \
  16444   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16445   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16446   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16447   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16448   __ret; \
  16449 })
  16450 #endif
  16451 
  /* vld4_dup_f32(__p0): statement-expression macro that evaluates to a
   * float32x2x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 9) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 2 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 9 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16452 #ifdef __LITTLE_ENDIAN__
  16453 #define vld4_dup_f32(__p0) __extension__ ({ \
  16454   float32x2x4_t __ret; \
  16455   __builtin_neon_vld4_dup_v(&__ret, __p0, 9); \
  16456   __ret; \
  16457 })
  16458 #else
  16459 #define vld4_dup_f32(__p0) __extension__ ({ \
  16460   float32x2x4_t __ret; \
  16461   __builtin_neon_vld4_dup_v(&__ret, __p0, 9); \
  16462  \
  16463   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16464   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16465   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16466   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16467   __ret; \
  16468 })
  16469 #endif
  16470 
  /* vld4_dup_s32(__p0): statement-expression macro that evaluates to an
   * int32x2x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 2) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 2 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 2 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16471 #ifdef __LITTLE_ENDIAN__
  16472 #define vld4_dup_s32(__p0) __extension__ ({ \
  16473   int32x2x4_t __ret; \
  16474   __builtin_neon_vld4_dup_v(&__ret, __p0, 2); \
  16475   __ret; \
  16476 })
  16477 #else
  16478 #define vld4_dup_s32(__p0) __extension__ ({ \
  16479   int32x2x4_t __ret; \
  16480   __builtin_neon_vld4_dup_v(&__ret, __p0, 2); \
  16481  \
  16482   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16483   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16484   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16485   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16486   __ret; \
  16487 })
  16488 #endif
  16489 
  /* vld4_dup_s64(__p0): statement-expression macro that evaluates to an
   * int64x1x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 3) fills the local
   * __ret, which is then yielded as the value of the expression.
   * Only one definition exists: there is no __LITTLE_ENDIAN__ split and no
   * lane shuffle here (NOTE(review): presumably because each val[] vector has
   * a single lane -- confirm). */
  16490 #define vld4_dup_s64(__p0) __extension__ ({ \
  16491   int64x1x4_t __ret; \
  16492   __builtin_neon_vld4_dup_v(&__ret, __p0, 3); \
  16493   __ret; \
  16494 })
  /* vld4_dup_s16(__p0): statement-expression macro that evaluates to an
   * int16x4x4_t. __builtin_neon_vld4_dup_v(&__ret, __p0, 1) fills the local
   * __ret, which is then yielded as the value of the expression.
   * When __LITTLE_ENDIAN__ is not defined, the 4 lanes of each of the four
   * val[] vectors are first reversed with __builtin_shufflevector.
   * NOTE(review): 1 is presumably the builtin's vector-type selector, and the
   * reversal presumably fixes lane order on big-endian targets -- confirm. */
  16495 #ifdef __LITTLE_ENDIAN__
  16496 #define vld4_dup_s16(__p0) __extension__ ({ \
  16497   int16x4x4_t __ret; \
  16498   __builtin_neon_vld4_dup_v(&__ret, __p0, 1); \
  16499   __ret; \
  16500 })
  16501 #else
  16502 #define vld4_dup_s16(__p0) __extension__ ({ \
  16503   int16x4x4_t __ret; \
  16504   __builtin_neon_vld4_dup_v(&__ret, __p0, 1); \
  16505  \
  16506   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16507   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16508   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16509   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16510   __ret; \
  16511 })
  16512 #endif
  16513 
  /* vld4_lane_p8(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a poly8x8x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x8_t and passed, together with __p0, __p2 and the
   * constant 4, to __builtin_neon_vld4_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 8 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 4 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16514 #ifdef __LITTLE_ENDIAN__
  16515 #define vld4_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  16516   poly8x8x4_t __ret; \
  16517   poly8x8x4_t __s1 = __p1; \
  16518   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 4); \
  16519   __ret; \
  16520 })
  16521 #else
  16522 #define vld4_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  16523   poly8x8x4_t __ret; \
  16524   poly8x8x4_t __s1 = __p1; \
  16525   poly8x8x4_t __rev1; \
  16526   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16527   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16528   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16529   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16530   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 4); \
  16531  \
  16532   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16533   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16534   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16535   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16536   __ret; \
  16537 })
  16538 #endif
  16539 
  /* vld4_lane_p16(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a poly16x4x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x8_t and passed, together with __p0, __p2 and the
   * constant 5, to __builtin_neon_vld4_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 4 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 5 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16540 #ifdef __LITTLE_ENDIAN__
  16541 #define vld4_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  16542   poly16x4x4_t __ret; \
  16543   poly16x4x4_t __s1 = __p1; \
  16544   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 5); \
  16545   __ret; \
  16546 })
  16547 #else
  16548 #define vld4_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  16549   poly16x4x4_t __ret; \
  16550   poly16x4x4_t __s1 = __p1; \
  16551   poly16x4x4_t __rev1; \
  16552   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16553   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16554   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16555   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16556   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 5); \
  16557  \
  16558   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16559   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16560   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16561   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16562   __ret; \
  16563 })
  16564 #endif
  16565 
  /* vld4q_lane_p16(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a poly16x8x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 37, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 8 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 37 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16566 #ifdef __LITTLE_ENDIAN__
  16567 #define vld4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  16568   poly16x8x4_t __ret; \
  16569   poly16x8x4_t __s1 = __p1; \
  16570   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 37); \
  16571   __ret; \
  16572 })
  16573 #else
  16574 #define vld4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  16575   poly16x8x4_t __ret; \
  16576   poly16x8x4_t __s1 = __p1; \
  16577   poly16x8x4_t __rev1; \
  16578   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16579   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16580   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16581   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16582   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 37); \
  16583  \
  16584   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16585   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16586   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16587   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16588   __ret; \
  16589 })
  16590 #endif
  16591 
  /* vld4q_lane_u32(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a uint32x4x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 50, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 4 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 50 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16592 #ifdef __LITTLE_ENDIAN__
  16593 #define vld4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  16594   uint32x4x4_t __ret; \
  16595   uint32x4x4_t __s1 = __p1; \
  16596   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 50); \
  16597   __ret; \
  16598 })
  16599 #else
  16600 #define vld4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  16601   uint32x4x4_t __ret; \
  16602   uint32x4x4_t __s1 = __p1; \
  16603   uint32x4x4_t __rev1; \
  16604   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16605   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16606   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16607   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16608   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 50); \
  16609  \
  16610   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16611   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16612   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16613   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16614   __ret; \
  16615 })
  16616 #endif
  16617 
  /* vld4q_lane_u16(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a uint16x8x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 49, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 8 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 49 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16618 #ifdef __LITTLE_ENDIAN__
  16619 #define vld4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  16620   uint16x8x4_t __ret; \
  16621   uint16x8x4_t __s1 = __p1; \
  16622   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 49); \
  16623   __ret; \
  16624 })
  16625 #else
  16626 #define vld4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  16627   uint16x8x4_t __ret; \
  16628   uint16x8x4_t __s1 = __p1; \
  16629   uint16x8x4_t __rev1; \
  16630   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16631   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16632   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16633   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16634   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 49); \
  16635  \
  16636   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16637   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16638   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16639   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16640   __ret; \
  16641 })
  16642 #endif
  16643 
  /* vld4q_lane_f32(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a float32x4x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 41, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 4 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 41 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16644 #ifdef __LITTLE_ENDIAN__
  16645 #define vld4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  16646   float32x4x4_t __ret; \
  16647   float32x4x4_t __s1 = __p1; \
  16648   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 41); \
  16649   __ret; \
  16650 })
  16651 #else
  16652 #define vld4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  16653   float32x4x4_t __ret; \
  16654   float32x4x4_t __s1 = __p1; \
  16655   float32x4x4_t __rev1; \
  16656   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16657   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16658   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16659   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16660   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 41); \
  16661  \
  16662   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16663   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16664   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16665   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16666   __ret; \
  16667 })
  16668 #endif
  16669 
  /* vld4q_lane_s32(__p0, __p1, __p2): statement-expression macro that evaluates
   * to an int32x4x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 34, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 4 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 34 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16670 #ifdef __LITTLE_ENDIAN__
  16671 #define vld4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  16672   int32x4x4_t __ret; \
  16673   int32x4x4_t __s1 = __p1; \
  16674   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 34); \
  16675   __ret; \
  16676 })
  16677 #else
  16678 #define vld4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  16679   int32x4x4_t __ret; \
  16680   int32x4x4_t __s1 = __p1; \
  16681   int32x4x4_t __rev1; \
  16682   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16683   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16684   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16685   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16686   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 34); \
  16687  \
  16688   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16689   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16690   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16691   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16692   __ret; \
  16693 })
  16694 #endif
  16695 
  /* vld4q_lane_s16(__p0, __p1, __p2): statement-expression macro that evaluates
   * to an int16x8x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x16_t and passed, together with __p0, __p2 and the
   * constant 33, to __builtin_neon_vld4q_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 8 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 33 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16696 #ifdef __LITTLE_ENDIAN__
  16697 #define vld4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  16698   int16x8x4_t __ret; \
  16699   int16x8x4_t __s1 = __p1; \
  16700   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 33); \
  16701   __ret; \
  16702 })
  16703 #else
  16704 #define vld4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  16705   int16x8x4_t __ret; \
  16706   int16x8x4_t __s1 = __p1; \
  16707   int16x8x4_t __rev1; \
  16708   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16709   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16710   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16711   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16712   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 33); \
  16713  \
  16714   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16715   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16716   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16717   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16718   __ret; \
  16719 })
  16720 #endif
  16721 
  /* vld4_lane_u8(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a uint8x8x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x8_t and passed, together with __p0, __p2 and the
   * constant 16, to __builtin_neon_vld4_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 8 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 16 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16722 #ifdef __LITTLE_ENDIAN__
  16723 #define vld4_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  16724   uint8x8x4_t __ret; \
  16725   uint8x8x4_t __s1 = __p1; \
  16726   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 16); \
  16727   __ret; \
  16728 })
  16729 #else
  16730 #define vld4_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  16731   uint8x8x4_t __ret; \
  16732   uint8x8x4_t __s1 = __p1; \
  16733   uint8x8x4_t __rev1; \
  16734   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16735   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16736   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16737   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16738   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 16); \
  16739  \
  16740   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16741   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16742   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16743   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16744   __ret; \
  16745 })
  16746 #endif
  16747 
  /* vld4_lane_u32(__p0, __p1, __p2): statement-expression macro that evaluates
   * to a uint32x2x4_t. __p1 is copied once into the local __s1; its four val[]
   * vectors are cast to int8x8_t and passed, together with __p0, __p2 and the
   * constant 18, to __builtin_neon_vld4_lane_v, which fills __ret.
   * When __LITTLE_ENDIAN__ is not defined, lane-reversed copies (__rev1) are
   * passed instead, and the 2 lanes of each result vector are reversed again
   * before __ret is yielded.
   * NOTE(review): __p2 is presumably the lane index and 18 the vector-type
   * selector -- confirm against the ACLE / header generator. */
  16748 #ifdef __LITTLE_ENDIAN__
  16749 #define vld4_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  16750   uint32x2x4_t __ret; \
  16751   uint32x2x4_t __s1 = __p1; \
  16752   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 18); \
  16753   __ret; \
  16754 })
  16755 #else
  16756 #define vld4_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  16757   uint32x2x4_t __ret; \
  16758   uint32x2x4_t __s1 = __p1; \
  16759   uint32x2x4_t __rev1; \
  16760   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  16761   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  16762   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  16763   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  16764   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 18); \
  16765  \
  16766   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16767   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16768   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16769   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16770   __ret; \
  16771 })
  16772 #endif
  16773 
  16774 #ifdef __LITTLE_ENDIAN__
        /* vld4_lane_u16, __LITTLE_ENDIAN__ build. Statement-expression macro: copies
         * __p1 into the local __s1, passes &__ret, __p0, the four __s1.val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 17 to
         * __builtin_neon_vld4_lane_v, and evaluates to __ret (a uint16x4x4_t).
         * NOTE(review): 17 is presumably the builtin's element-type code - confirm. */
  16775 #define vld4_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  16776   uint16x4x4_t __ret; \
  16777   uint16x4x4_t __s1 = __p1; \
  16778   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 17); \
  16779   __ret; \
  16780 })
  16781 #else
        /* vld4_lane_u16 when __LITTLE_ENDIAN__ is not defined. Same builtin call, but
         * each of the four __s1.val[] vectors is first copied into __rev1 with its
         * 4 lanes in reverse order, and each __ret.val[] vector is lane-reversed
         * again after the call. */
  16782 #define vld4_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  16783   uint16x4x4_t __ret; \
  16784   uint16x4x4_t __s1 = __p1; \
  16785   uint16x4x4_t __rev1; \
  16786   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16787   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16788   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16789   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16790   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 17); \
  16791  \
  16792   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16793   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16794   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16795   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16796   __ret; \
  16797 })
  16798 #endif
  16799 
  16800 #ifdef __LITTLE_ENDIAN__
        /* vld4_lane_s8, __LITTLE_ENDIAN__ build. Statement-expression macro: copies
         * __p1 into the local __s1, passes &__ret, __p0, the four __s1.val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 0 to
         * __builtin_neon_vld4_lane_v, and evaluates to __ret (an int8x8x4_t).
         * NOTE(review): 0 is presumably the builtin's element-type code - confirm. */
  16801 #define vld4_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  16802   int8x8x4_t __ret; \
  16803   int8x8x4_t __s1 = __p1; \
  16804   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 0); \
  16805   __ret; \
  16806 })
  16807 #else
        /* vld4_lane_s8 when __LITTLE_ENDIAN__ is not defined. Same builtin call, but
         * each of the four __s1.val[] vectors is first copied into __rev1 with its
         * 8 lanes in reverse order, and each __ret.val[] vector is lane-reversed
         * again after the call. */
  16808 #define vld4_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  16809   int8x8x4_t __ret; \
  16810   int8x8x4_t __s1 = __p1; \
  16811   int8x8x4_t __rev1; \
  16812   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16813   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16814   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16815   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16816   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 0); \
  16817  \
  16818   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  16819   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  16820   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  16821   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  16822   __ret; \
  16823 })
  16824 #endif
  16825 
  16826 #ifdef __LITTLE_ENDIAN__
        /* vld4_lane_f32, __LITTLE_ENDIAN__ build. Statement-expression macro: copies
         * __p1 into the local __s1, passes &__ret, __p0, the four __s1.val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 9 to
         * __builtin_neon_vld4_lane_v, and evaluates to __ret (a float32x2x4_t).
         * NOTE(review): 9 is presumably the builtin's element-type code - confirm. */
  16827 #define vld4_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  16828   float32x2x4_t __ret; \
  16829   float32x2x4_t __s1 = __p1; \
  16830   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 9); \
  16831   __ret; \
  16832 })
  16833 #else
        /* vld4_lane_f32 when __LITTLE_ENDIAN__ is not defined. Same builtin call, but
         * each of the four __s1.val[] vectors is first copied into __rev1 with its
         * 2 lanes in reverse order, and each __ret.val[] vector is lane-reversed
         * again after the call. */
  16834 #define vld4_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  16835   float32x2x4_t __ret; \
  16836   float32x2x4_t __s1 = __p1; \
  16837   float32x2x4_t __rev1; \
  16838   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  16839   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  16840   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  16841   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  16842   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 9); \
  16843  \
  16844   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16845   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16846   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16847   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16848   __ret; \
  16849 })
  16850 #endif
  16851 
  16852 #ifdef __LITTLE_ENDIAN__
        /* vld4_lane_s32, __LITTLE_ENDIAN__ build. Statement-expression macro: copies
         * __p1 into the local __s1, passes &__ret, __p0, the four __s1.val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 2 to
         * __builtin_neon_vld4_lane_v, and evaluates to __ret (an int32x2x4_t).
         * NOTE(review): 2 is presumably the builtin's element-type code - confirm. */
  16853 #define vld4_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  16854   int32x2x4_t __ret; \
  16855   int32x2x4_t __s1 = __p1; \
  16856   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 2); \
  16857   __ret; \
  16858 })
  16859 #else
        /* vld4_lane_s32 when __LITTLE_ENDIAN__ is not defined. Same builtin call, but
         * each of the four __s1.val[] vectors is first copied into __rev1 with its
         * 2 lanes in reverse order, and each __ret.val[] vector is lane-reversed
         * again after the call. */
  16860 #define vld4_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  16861   int32x2x4_t __ret; \
  16862   int32x2x4_t __s1 = __p1; \
  16863   int32x2x4_t __rev1; \
  16864   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  16865   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  16866   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  16867   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  16868   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 2); \
  16869  \
  16870   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  16871   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  16872   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  16873   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  16874   __ret; \
  16875 })
  16876 #endif
  16877 
  16878 #ifdef __LITTLE_ENDIAN__
        /* vld4_lane_s16, __LITTLE_ENDIAN__ build. Statement-expression macro: copies
         * __p1 into the local __s1, passes &__ret, __p0, the four __s1.val[] vectors
         * (each cast to int8x8_t), __p2 and the constant 1 to
         * __builtin_neon_vld4_lane_v, and evaluates to __ret (an int16x4x4_t).
         * NOTE(review): 1 is presumably the builtin's element-type code - confirm. */
  16879 #define vld4_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  16880   int16x4x4_t __ret; \
  16881   int16x4x4_t __s1 = __p1; \
  16882   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 1); \
  16883   __ret; \
  16884 })
  16885 #else
        /* vld4_lane_s16 when __LITTLE_ENDIAN__ is not defined. Same builtin call, but
         * each of the four __s1.val[] vectors is first copied into __rev1 with its
         * 4 lanes in reverse order, and each __ret.val[] vector is lane-reversed
         * again after the call. */
  16886 #define vld4_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  16887   int16x4x4_t __ret; \
  16888   int16x4x4_t __s1 = __p1; \
  16889   int16x4x4_t __rev1; \
  16890   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  16891   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  16892   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  16893   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  16894   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 1); \
  16895  \
  16896   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  16897   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  16898   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  16899   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  16900   __ret; \
  16901 })
  16902 #endif
  16903 
  16904 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_u8, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 48 to __builtin_neon_vmaxq_v, and returns the result
         * cast to uint8x16_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 48 is presumably the builtin's element-type code - confirm. */
  16905 __ai __attribute__((target("neon"))) uint8x16_t vmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  16906   uint8x16_t __ret;
  16907   __ret = (uint8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  16908   return __ret;
  16909 }
  16910 #else
        /* vmaxq_u8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 16 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  16911 __ai __attribute__((target("neon"))) uint8x16_t vmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  16912   uint8x16_t __ret;
  16913   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16914   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16915   __ret = (uint8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  16916   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16917   return __ret;
  16918 }
  16919 #endif
  16920 
  16921 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_u32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 50 to __builtin_neon_vmaxq_v, and returns the result
         * cast to uint32x4_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 50 is presumably the builtin's element-type code - confirm. */
  16922 __ai __attribute__((target("neon"))) uint32x4_t vmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  16923   uint32x4_t __ret;
  16924   __ret = (uint32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  16925   return __ret;
  16926 }
  16927 #else
        /* vmaxq_u32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  16928 __ai __attribute__((target("neon"))) uint32x4_t vmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  16929   uint32x4_t __ret;
  16930   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  16931   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  16932   __ret = (uint32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  16933   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  16934   return __ret;
  16935 }
  16936 #endif
  16937 
  16938 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_u16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 49 to __builtin_neon_vmaxq_v, and returns the result
         * cast to uint16x8_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 49 is presumably the builtin's element-type code - confirm. */
  16939 __ai __attribute__((target("neon"))) uint16x8_t vmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  16940   uint16x8_t __ret;
  16941   __ret = (uint16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  16942   return __ret;
  16943 }
  16944 #else
        /* vmaxq_u16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 8 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  16945 __ai __attribute__((target("neon"))) uint16x8_t vmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  16946   uint16x8_t __ret;
  16947   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  16948   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  16949   __ret = (uint16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  16950   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  16951   return __ret;
  16952 }
  16953 #endif
  16954 
  16955 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_s8, __LITTLE_ENDIAN__ build: passes __p0 and __p1 (cast to int8x16_t)
         * with the constant 32 to __builtin_neon_vmaxq_v and returns the result cast
         * to int8x16_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 32 is presumably the builtin's element-type code - confirm. */
  16956 __ai __attribute__((target("neon"))) int8x16_t vmaxq_s8(int8x16_t __p0, int8x16_t __p1) {
  16957   int8x16_t __ret;
  16958   __ret = (int8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  16959   return __ret;
  16960 }
  16961 #else
        /* vmaxq_s8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 16 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  16962 __ai __attribute__((target("neon"))) int8x16_t vmaxq_s8(int8x16_t __p0, int8x16_t __p1) {
  16963   int8x16_t __ret;
  16964   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16965   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16966   __ret = (int8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  16967   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  16968   return __ret;
  16969 }
  16970 #endif
  16971 
  16972 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_f32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 41 to __builtin_neon_vmaxq_v, and returns the result
         * cast to float32x4_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 41 is presumably the builtin's element-type code - confirm. */
  16973 __ai __attribute__((target("neon"))) float32x4_t vmaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  16974   float32x4_t __ret;
  16975   __ret = (float32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  16976   return __ret;
  16977 }
  16978 #else
        /* vmaxq_f32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  16979 __ai __attribute__((target("neon"))) float32x4_t vmaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  16980   float32x4_t __ret;
  16981   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  16982   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  16983   __ret = (float32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  16984   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  16985   return __ret;
  16986 }
  16987 #endif
  16988 
  16989 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_s32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 34 to __builtin_neon_vmaxq_v, and returns the result
         * cast to int32x4_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 34 is presumably the builtin's element-type code - confirm. */
  16990 __ai __attribute__((target("neon"))) int32x4_t vmaxq_s32(int32x4_t __p0, int32x4_t __p1) {
  16991   int32x4_t __ret;
  16992   __ret = (int32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  16993   return __ret;
  16994 }
  16995 #else
        /* vmaxq_s32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  16996 __ai __attribute__((target("neon"))) int32x4_t vmaxq_s32(int32x4_t __p0, int32x4_t __p1) {
  16997   int32x4_t __ret;
  16998   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  16999   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17000   __ret = (int32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  17001   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17002   return __ret;
  17003 }
  17004 #endif
  17005 
  17006 #ifdef __LITTLE_ENDIAN__
        /* vmaxq_s16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 33 to __builtin_neon_vmaxq_v, and returns the result
         * cast to int16x8_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 33 is presumably the builtin's element-type code - confirm. */
  17007 __ai __attribute__((target("neon"))) int16x8_t vmaxq_s16(int16x8_t __p0, int16x8_t __p1) {
  17008   int16x8_t __ret;
  17009   __ret = (int16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  17010   return __ret;
  17011 }
  17012 #else
        /* vmaxq_s16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 8 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17013 __ai __attribute__((target("neon"))) int16x8_t vmaxq_s16(int16x8_t __p0, int16x8_t __p1) {
  17014   int16x8_t __ret;
  17015   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17016   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17017   __ret = (int16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  17018   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17019   return __ret;
  17020 }
  17021 #endif
  17022 
  17023 #ifdef __LITTLE_ENDIAN__
        /* vmax_u8, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 16 to __builtin_neon_vmax_v, and returns the result
         * cast to uint8x8_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 16 is presumably the builtin's element-type code - confirm. */
  17024 __ai __attribute__((target("neon"))) uint8x8_t vmax_u8(uint8x8_t __p0, uint8x8_t __p1) {
  17025   uint8x8_t __ret;
  17026   __ret = (uint8x8_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  17027   return __ret;
  17028 }
  17029 #else
        /* vmax_u8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 8 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17030 __ai __attribute__((target("neon"))) uint8x8_t vmax_u8(uint8x8_t __p0, uint8x8_t __p1) {
  17031   uint8x8_t __ret;
  17032   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17033   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17034   __ret = (uint8x8_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  17035   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17036   return __ret;
  17037 }
  17038 #endif
  17039 
  17040 #ifdef __LITTLE_ENDIAN__
        /* vmax_u32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 18 to __builtin_neon_vmax_v, and returns the result
         * cast to uint32x2_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 18 is presumably the builtin's element-type code - confirm. */
  17041 __ai __attribute__((target("neon"))) uint32x2_t vmax_u32(uint32x2_t __p0, uint32x2_t __p1) {
  17042   uint32x2_t __ret;
  17043   __ret = (uint32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  17044   return __ret;
  17045 }
  17046 #else
        /* vmax_u32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17047 __ai __attribute__((target("neon"))) uint32x2_t vmax_u32(uint32x2_t __p0, uint32x2_t __p1) {
  17048   uint32x2_t __ret;
  17049   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17050   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17051   __ret = (uint32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  17052   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17053   return __ret;
  17054 }
  17055 #endif
  17056 
  17057 #ifdef __LITTLE_ENDIAN__
        /* vmax_u16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 17 to __builtin_neon_vmax_v, and returns the result
         * cast to uint16x4_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 17 is presumably the builtin's element-type code - confirm. */
  17058 __ai __attribute__((target("neon"))) uint16x4_t vmax_u16(uint16x4_t __p0, uint16x4_t __p1) {
  17059   uint16x4_t __ret;
  17060   __ret = (uint16x4_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  17061   return __ret;
  17062 }
  17063 #else
        /* vmax_u16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 4 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17064 __ai __attribute__((target("neon"))) uint16x4_t vmax_u16(uint16x4_t __p0, uint16x4_t __p1) {
  17065   uint16x4_t __ret;
  17066   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17067   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17068   __ret = (uint16x4_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  17069   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17070   return __ret;
  17071 }
  17072 #endif
  17073 
  17074 #ifdef __LITTLE_ENDIAN__
        /* vmax_s8, __LITTLE_ENDIAN__ build: passes __p0 and __p1 (cast to int8x8_t)
         * with the constant 0 to __builtin_neon_vmax_v and returns the result cast
         * to int8x8_t. Going by the name this is the per-lane maximum; the operation
         * itself is inside the builtin.
         * NOTE(review): 0 is presumably the builtin's element-type code - confirm. */
  17075 __ai __attribute__((target("neon"))) int8x8_t vmax_s8(int8x8_t __p0, int8x8_t __p1) {
  17076   int8x8_t __ret;
  17077   __ret = (int8x8_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  17078   return __ret;
  17079 }
  17080 #else
        /* vmax_s8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 8 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17081 __ai __attribute__((target("neon"))) int8x8_t vmax_s8(int8x8_t __p0, int8x8_t __p1) {
  17082   int8x8_t __ret;
  17083   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17084   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17085   __ret = (int8x8_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  17086   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17087   return __ret;
  17088 }
  17089 #endif
  17090 
  17091 #ifdef __LITTLE_ENDIAN__
        /* vmax_f32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 9 to __builtin_neon_vmax_v, and returns the result
         * cast to float32x2_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 9 is presumably the builtin's element-type code - confirm. */
  17092 __ai __attribute__((target("neon"))) float32x2_t vmax_f32(float32x2_t __p0, float32x2_t __p1) {
  17093   float32x2_t __ret;
  17094   __ret = (float32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  17095   return __ret;
  17096 }
  17097 #else
        /* vmax_f32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17098 __ai __attribute__((target("neon"))) float32x2_t vmax_f32(float32x2_t __p0, float32x2_t __p1) {
  17099   float32x2_t __ret;
  17100   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17101   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17102   __ret = (float32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  17103   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17104   return __ret;
  17105 }
  17106 #endif
  17107 
  17108 #ifdef __LITTLE_ENDIAN__
        /* vmax_s32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 2 to __builtin_neon_vmax_v, and returns the result
         * cast to int32x2_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 2 is presumably the builtin's element-type code - confirm. */
  17109 __ai __attribute__((target("neon"))) int32x2_t vmax_s32(int32x2_t __p0, int32x2_t __p1) {
  17110   int32x2_t __ret;
  17111   __ret = (int32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  17112   return __ret;
  17113 }
  17114 #else
        /* vmax_s32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17115 __ai __attribute__((target("neon"))) int32x2_t vmax_s32(int32x2_t __p0, int32x2_t __p1) {
  17116   int32x2_t __ret;
  17117   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17118   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17119   __ret = (int32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  17120   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17121   return __ret;
  17122 }
  17123 #endif
  17124 
  17125 #ifdef __LITTLE_ENDIAN__
        /* vmax_s16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 1 to __builtin_neon_vmax_v, and returns the result
         * cast to int16x4_t. Going by the name this is the per-lane maximum; the
         * operation itself is inside the builtin.
         * NOTE(review): 1 is presumably the builtin's element-type code - confirm. */
  17126 __ai __attribute__((target("neon"))) int16x4_t vmax_s16(int16x4_t __p0, int16x4_t __p1) {
  17127   int16x4_t __ret;
  17128   __ret = (int16x4_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  17129   return __ret;
  17130 }
  17131 #else
        /* vmax_s16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 4 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17132 __ai __attribute__((target("neon"))) int16x4_t vmax_s16(int16x4_t __p0, int16x4_t __p1) {
  17133   int16x4_t __ret;
  17134   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17135   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17136   __ret = (int16x4_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  17137   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17138   return __ret;
  17139 }
  17140 #endif
  17141 
  17142 #ifdef __LITTLE_ENDIAN__
        /* vminq_u8, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 48 to __builtin_neon_vminq_v, and returns the result
         * cast to uint8x16_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 48 is presumably the builtin's element-type code - confirm. */
  17143 __ai __attribute__((target("neon"))) uint8x16_t vminq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  17144   uint8x16_t __ret;
  17145   __ret = (uint8x16_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  17146   return __ret;
  17147 }
  17148 #else
        /* vminq_u8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 16 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17149 __ai __attribute__((target("neon"))) uint8x16_t vminq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  17150   uint8x16_t __ret;
  17151   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17152   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17153   __ret = (uint8x16_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  17154   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17155   return __ret;
  17156 }
  17157 #endif
  17158 
  17159 #ifdef __LITTLE_ENDIAN__
        /* vminq_u32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 50 to __builtin_neon_vminq_v, and returns the result
         * cast to uint32x4_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 50 is presumably the builtin's element-type code - confirm. */
  17160 __ai __attribute__((target("neon"))) uint32x4_t vminq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  17161   uint32x4_t __ret;
  17162   __ret = (uint32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  17163   return __ret;
  17164 }
  17165 #else
        /* vminq_u32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17166 __ai __attribute__((target("neon"))) uint32x4_t vminq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  17167   uint32x4_t __ret;
  17168   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17169   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17170   __ret = (uint32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  17171   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17172   return __ret;
  17173 }
  17174 #endif
  17175 
  17176 #ifdef __LITTLE_ENDIAN__
        /* vminq_u16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 49 to __builtin_neon_vminq_v, and returns the result
         * cast to uint16x8_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 49 is presumably the builtin's element-type code - confirm. */
  17177 __ai __attribute__((target("neon"))) uint16x8_t vminq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  17178   uint16x8_t __ret;
  17179   __ret = (uint16x8_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  17180   return __ret;
  17181 }
  17182 #else
        /* vminq_u16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 8 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17183 __ai __attribute__((target("neon"))) uint16x8_t vminq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  17184   uint16x8_t __ret;
  17185   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17186   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17187   __ret = (uint16x8_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  17188   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17189   return __ret;
  17190 }
  17191 #endif
  17192 
  17193 #ifdef __LITTLE_ENDIAN__
        /* vminq_s8, __LITTLE_ENDIAN__ build: passes __p0 and __p1 (cast to int8x16_t)
         * with the constant 32 to __builtin_neon_vminq_v and returns the result cast
         * to int8x16_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 32 is presumably the builtin's element-type code - confirm. */
  17194 __ai __attribute__((target("neon"))) int8x16_t vminq_s8(int8x16_t __p0, int8x16_t __p1) {
  17195   int8x16_t __ret;
  17196   __ret = (int8x16_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  17197   return __ret;
  17198 }
  17199 #else
        /* vminq_s8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 16 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17200 __ai __attribute__((target("neon"))) int8x16_t vminq_s8(int8x16_t __p0, int8x16_t __p1) {
  17201   int8x16_t __ret;
  17202   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17203   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17204   __ret = (int8x16_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  17205   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17206   return __ret;
  17207 }
  17208 #endif
  17209 
  17210 #ifdef __LITTLE_ENDIAN__
        /* vminq_f32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 41 to __builtin_neon_vminq_v, and returns the result
         * cast to float32x4_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 41 is presumably the builtin's element-type code - confirm. */
  17211 __ai __attribute__((target("neon"))) float32x4_t vminq_f32(float32x4_t __p0, float32x4_t __p1) {
  17212   float32x4_t __ret;
  17213   __ret = (float32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  17214   return __ret;
  17215 }
  17216 #else
        /* vminq_f32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17217 __ai __attribute__((target("neon"))) float32x4_t vminq_f32(float32x4_t __p0, float32x4_t __p1) {
  17218   float32x4_t __ret;
  17219   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17220   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17221   __ret = (float32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  17222   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17223   return __ret;
  17224 }
  17225 #endif
  17226 
  17227 #ifdef __LITTLE_ENDIAN__
        /* vminq_s32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 34 to __builtin_neon_vminq_v, and returns the result
         * cast to int32x4_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 34 is presumably the builtin's element-type code - confirm. */
  17228 __ai __attribute__((target("neon"))) int32x4_t vminq_s32(int32x4_t __p0, int32x4_t __p1) {
  17229   int32x4_t __ret;
  17230   __ret = (int32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  17231   return __ret;
  17232 }
  17233 #else
        /* vminq_s32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 4 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17234 __ai __attribute__((target("neon"))) int32x4_t vminq_s32(int32x4_t __p0, int32x4_t __p1) {
  17235   int32x4_t __ret;
  17236   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17237   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17238   __ret = (int32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  17239   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17240   return __ret;
  17241 }
  17242 #endif
  17243 
  17244 #ifdef __LITTLE_ENDIAN__
        /* vminq_s16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x16_t, passes
         * them with the constant 33 to __builtin_neon_vminq_v, and returns the result
         * cast to int16x8_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 33 is presumably the builtin's element-type code - confirm. */
  17245 __ai __attribute__((target("neon"))) int16x8_t vminq_s16(int16x8_t __p0, int16x8_t __p1) {
  17246   int16x8_t __ret;
  17247   __ret = (int16x8_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  17248   return __ret;
  17249 }
  17250 #else
        /* vminq_s16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold
         * __p0/__p1 with their 8 lanes in reverse order; the same builtin call runs
         * on those copies and its result is lane-reversed again before being
         * returned. */
  17251 __ai __attribute__((target("neon"))) int16x8_t vminq_s16(int16x8_t __p0, int16x8_t __p1) {
  17252   int16x8_t __ret;
  17253   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17254   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17255   __ret = (int16x8_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  17256   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17257   return __ret;
  17258 }
  17259 #endif
  17260 
  17261 #ifdef __LITTLE_ENDIAN__
        /* vmin_u8, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 16 to __builtin_neon_vmin_v, and returns the result
         * cast to uint8x8_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 16 is presumably the builtin's element-type code - confirm. */
  17262 __ai __attribute__((target("neon"))) uint8x8_t vmin_u8(uint8x8_t __p0, uint8x8_t __p1) {
  17263   uint8x8_t __ret;
  17264   __ret = (uint8x8_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  17265   return __ret;
  17266 }
  17267 #else
        /* vmin_u8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 8 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17268 __ai __attribute__((target("neon"))) uint8x8_t vmin_u8(uint8x8_t __p0, uint8x8_t __p1) {
  17269   uint8x8_t __ret;
  17270   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17271   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17272   __ret = (uint8x8_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  17273   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17274   return __ret;
  17275 }
  17276 #endif
  17277 
  17278 #ifdef __LITTLE_ENDIAN__
        /* vmin_u32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 18 to __builtin_neon_vmin_v, and returns the result
         * cast to uint32x2_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 18 is presumably the builtin's element-type code - confirm. */
  17279 __ai __attribute__((target("neon"))) uint32x2_t vmin_u32(uint32x2_t __p0, uint32x2_t __p1) {
  17280   uint32x2_t __ret;
  17281   __ret = (uint32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  17282   return __ret;
  17283 }
  17284 #else
        /* vmin_u32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17285 __ai __attribute__((target("neon"))) uint32x2_t vmin_u32(uint32x2_t __p0, uint32x2_t __p1) {
  17286   uint32x2_t __ret;
  17287   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17288   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17289   __ret = (uint32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  17290   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17291   return __ret;
  17292 }
  17293 #endif
  17294 
  17295 #ifdef __LITTLE_ENDIAN__
        /* vmin_u16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 17 to __builtin_neon_vmin_v, and returns the result
         * cast to uint16x4_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 17 is presumably the builtin's element-type code - confirm. */
  17296 __ai __attribute__((target("neon"))) uint16x4_t vmin_u16(uint16x4_t __p0, uint16x4_t __p1) {
  17297   uint16x4_t __ret;
  17298   __ret = (uint16x4_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  17299   return __ret;
  17300 }
  17301 #else
        /* vmin_u16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 4 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17302 __ai __attribute__((target("neon"))) uint16x4_t vmin_u16(uint16x4_t __p0, uint16x4_t __p1) {
  17303   uint16x4_t __ret;
  17304   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17305   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17306   __ret = (uint16x4_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  17307   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17308   return __ret;
  17309 }
  17310 #endif
  17311 
  17312 #ifdef __LITTLE_ENDIAN__
        /* vmin_s8, __LITTLE_ENDIAN__ build: passes __p0 and __p1 (cast to int8x8_t)
         * with the constant 0 to __builtin_neon_vmin_v and returns the result cast
         * to int8x8_t. Going by the name this is the per-lane minimum; the operation
         * itself is inside the builtin.
         * NOTE(review): 0 is presumably the builtin's element-type code - confirm. */
  17313 __ai __attribute__((target("neon"))) int8x8_t vmin_s8(int8x8_t __p0, int8x8_t __p1) {
  17314   int8x8_t __ret;
  17315   __ret = (int8x8_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  17316   return __ret;
  17317 }
  17318 #else
        /* vmin_s8 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 8 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17319 __ai __attribute__((target("neon"))) int8x8_t vmin_s8(int8x8_t __p0, int8x8_t __p1) {
  17320   int8x8_t __ret;
  17321   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17322   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17323   __ret = (int8x8_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  17324   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17325   return __ret;
  17326 }
  17327 #endif
  17328 
  17329 #ifdef __LITTLE_ENDIAN__
        /* vmin_f32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 9 to __builtin_neon_vmin_v, and returns the result
         * cast to float32x2_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 9 is presumably the builtin's element-type code - confirm. */
  17330 __ai __attribute__((target("neon"))) float32x2_t vmin_f32(float32x2_t __p0, float32x2_t __p1) {
  17331   float32x2_t __ret;
  17332   __ret = (float32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  17333   return __ret;
  17334 }
  17335 #else
        /* vmin_f32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17336 __ai __attribute__((target("neon"))) float32x2_t vmin_f32(float32x2_t __p0, float32x2_t __p1) {
  17337   float32x2_t __ret;
  17338   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17339   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17340   __ret = (float32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  17341   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17342   return __ret;
  17343 }
  17344 #endif
  17345 
  17346 #ifdef __LITTLE_ENDIAN__
        /* vmin_s32, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 2 to __builtin_neon_vmin_v, and returns the result
         * cast to int32x2_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 2 is presumably the builtin's element-type code - confirm. */
  17347 __ai __attribute__((target("neon"))) int32x2_t vmin_s32(int32x2_t __p0, int32x2_t __p1) {
  17348   int32x2_t __ret;
  17349   __ret = (int32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  17350   return __ret;
  17351 }
  17352 #else
        /* vmin_s32 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 2 lanes swapped; the same builtin call runs on those copies and
         * its result has its lanes swapped again before being returned. */
  17353 __ai __attribute__((target("neon"))) int32x2_t vmin_s32(int32x2_t __p0, int32x2_t __p1) {
  17354   int32x2_t __ret;
  17355   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17356   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17357   __ret = (int32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  17358   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17359   return __ret;
  17360 }
  17361 #endif
  17362 
  17363 #ifdef __LITTLE_ENDIAN__
        /* vmin_s16, __LITTLE_ENDIAN__ build: casts __p0 and __p1 to int8x8_t, passes
         * them with the constant 1 to __builtin_neon_vmin_v, and returns the result
         * cast to int16x4_t. Going by the name this is the per-lane minimum; the
         * operation itself is inside the builtin.
         * NOTE(review): 1 is presumably the builtin's element-type code - confirm. */
  17364 __ai __attribute__((target("neon"))) int16x4_t vmin_s16(int16x4_t __p0, int16x4_t __p1) {
  17365   int16x4_t __ret;
  17366   __ret = (int16x4_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  17367   return __ret;
  17368 }
  17369 #else
        /* vmin_s16 when __LITTLE_ENDIAN__ is not defined: __rev0/__rev1 hold __p0/__p1
         * with their 4 lanes in reverse order; the same builtin call runs on those
         * copies and its result is lane-reversed again before being returned. */
  17370 __ai __attribute__((target("neon"))) int16x4_t vmin_s16(int16x4_t __p0, int16x4_t __p1) {
  17371   int16x4_t __ret;
  17372   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17373   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17374   __ret = (int16x4_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  17375   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17376   return __ret;
  17377 }
  17378 #endif
  17379 
  17380 #ifdef __LITTLE_ENDIAN__
  17381 __ai __attribute__((target("neon"))) uint8x16_t vmlaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  17382   uint8x16_t __ret;
  17383   __ret = __p0 + __p1 * __p2;
  17384   return __ret;
  17385 }
  17386 #else
  17387 __ai __attribute__((target("neon"))) uint8x16_t vmlaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  17388   uint8x16_t __ret;
  17389   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17390   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17391   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17392   __ret = __rev0 + __rev1 * __rev2;
  17393   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17394   return __ret;
  17395 }
  17396 #endif
  17397 
  17398 #ifdef __LITTLE_ENDIAN__
  17399 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  17400   uint32x4_t __ret;
  17401   __ret = __p0 + __p1 * __p2;
  17402   return __ret;
  17403 }
  17404 #else
  17405 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  17406   uint32x4_t __ret;
  17407   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17408   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17409   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  17410   __ret = __rev0 + __rev1 * __rev2;
  17411   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17412   return __ret;
  17413 }
  17414 #endif
  17415 
  17416 #ifdef __LITTLE_ENDIAN__
  17417 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  17418   uint16x8_t __ret;
  17419   __ret = __p0 + __p1 * __p2;
  17420   return __ret;
  17421 }
  17422 #else
  17423 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  17424   uint16x8_t __ret;
  17425   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17426   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17427   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  17428   __ret = __rev0 + __rev1 * __rev2;
  17429   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17430   return __ret;
  17431 }
  17432 #endif
  17433 
  17434 #ifdef __LITTLE_ENDIAN__
  17435 __ai __attribute__((target("neon"))) int8x16_t vmlaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  17436   int8x16_t __ret;
  17437   __ret = __p0 + __p1 * __p2;
  17438   return __ret;
  17439 }
  17440 #else
  17441 __ai __attribute__((target("neon"))) int8x16_t vmlaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  17442   int8x16_t __ret;
  17443   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17444   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17445   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17446   __ret = __rev0 + __rev1 * __rev2;
  17447   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  17448   return __ret;
  17449 }
  17450 #endif
  17451 
  17452 #ifdef __LITTLE_ENDIAN__
  17453 __ai __attribute__((target("neon"))) float32x4_t vmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  17454   float32x4_t __ret;
  17455   __ret = __p0 + __p1 * __p2;
  17456   return __ret;
  17457 }
  17458 #else
  17459 __ai __attribute__((target("neon"))) float32x4_t vmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  17460   float32x4_t __ret;
  17461   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17462   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17463   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  17464   __ret = __rev0 + __rev1 * __rev2;
  17465   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17466   return __ret;
  17467 }
  17468 #endif
  17469 
  17470 #ifdef __LITTLE_ENDIAN__
  17471 __ai __attribute__((target("neon"))) int32x4_t vmlaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  17472   int32x4_t __ret;
  17473   __ret = __p0 + __p1 * __p2;
  17474   return __ret;
  17475 }
  17476 #else
  17477 __ai __attribute__((target("neon"))) int32x4_t vmlaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  17478   int32x4_t __ret;
  17479   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17480   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17481   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  17482   __ret = __rev0 + __rev1 * __rev2;
  17483   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17484   return __ret;
  17485 }
  17486 #endif
  17487 
  17488 #ifdef __LITTLE_ENDIAN__
  17489 __ai __attribute__((target("neon"))) int16x8_t vmlaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  17490   int16x8_t __ret;
  17491   __ret = __p0 + __p1 * __p2;
  17492   return __ret;
  17493 }
  17494 #else
  17495 __ai __attribute__((target("neon"))) int16x8_t vmlaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  17496   int16x8_t __ret;
  17497   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17498   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17499   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  17500   __ret = __rev0 + __rev1 * __rev2;
  17501   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17502   return __ret;
  17503 }
  17504 #endif
  17505 
  17506 #ifdef __LITTLE_ENDIAN__
  17507 __ai __attribute__((target("neon"))) uint8x8_t vmla_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  17508   uint8x8_t __ret;
  17509   __ret = __p0 + __p1 * __p2;
  17510   return __ret;
  17511 }
  17512 #else
  17513 __ai __attribute__((target("neon"))) uint8x8_t vmla_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  17514   uint8x8_t __ret;
  17515   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17516   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17517   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  17518   __ret = __rev0 + __rev1 * __rev2;
  17519   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17520   return __ret;
  17521 }
  17522 #endif
  17523 
  17524 #ifdef __LITTLE_ENDIAN__
  17525 __ai __attribute__((target("neon"))) uint32x2_t vmla_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  17526   uint32x2_t __ret;
  17527   __ret = __p0 + __p1 * __p2;
  17528   return __ret;
  17529 }
  17530 #else
  17531 __ai __attribute__((target("neon"))) uint32x2_t vmla_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  17532   uint32x2_t __ret;
  17533   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17534   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17535   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  17536   __ret = __rev0 + __rev1 * __rev2;
  17537   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17538   return __ret;
  17539 }
  17540 #endif
  17541 
  17542 #ifdef __LITTLE_ENDIAN__
  17543 __ai __attribute__((target("neon"))) uint16x4_t vmla_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  17544   uint16x4_t __ret;
  17545   __ret = __p0 + __p1 * __p2;
  17546   return __ret;
  17547 }
  17548 #else
  17549 __ai __attribute__((target("neon"))) uint16x4_t vmla_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  17550   uint16x4_t __ret;
  17551   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17552   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17553   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  17554   __ret = __rev0 + __rev1 * __rev2;
  17555   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17556   return __ret;
  17557 }
  17558 #endif
  17559 
  17560 #ifdef __LITTLE_ENDIAN__
  17561 __ai __attribute__((target("neon"))) int8x8_t vmla_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  17562   int8x8_t __ret;
  17563   __ret = __p0 + __p1 * __p2;
  17564   return __ret;
  17565 }
  17566 #else
  17567 __ai __attribute__((target("neon"))) int8x8_t vmla_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  17568   int8x8_t __ret;
  17569   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17570   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17571   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  17572   __ret = __rev0 + __rev1 * __rev2;
  17573   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17574   return __ret;
  17575 }
  17576 #endif
  17577 
  17578 #ifdef __LITTLE_ENDIAN__
  17579 __ai __attribute__((target("neon"))) float32x2_t vmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  17580   float32x2_t __ret;
  17581   __ret = __p0 + __p1 * __p2;
  17582   return __ret;
  17583 }
  17584 #else
  17585 __ai __attribute__((target("neon"))) float32x2_t vmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  17586   float32x2_t __ret;
  17587   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17588   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17589   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  17590   __ret = __rev0 + __rev1 * __rev2;
  17591   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17592   return __ret;
  17593 }
  17594 #endif
  17595 
  17596 #ifdef __LITTLE_ENDIAN__
  17597 __ai __attribute__((target("neon"))) int32x2_t vmla_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  17598   int32x2_t __ret;
  17599   __ret = __p0 + __p1 * __p2;
  17600   return __ret;
  17601 }
  17602 #else
  17603 __ai __attribute__((target("neon"))) int32x2_t vmla_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  17604   int32x2_t __ret;
  17605   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17606   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17607   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  17608   __ret = __rev0 + __rev1 * __rev2;
  17609   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17610   return __ret;
  17611 }
  17612 #endif
  17613 
  17614 #ifdef __LITTLE_ENDIAN__
  17615 __ai __attribute__((target("neon"))) int16x4_t vmla_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  17616   int16x4_t __ret;
  17617   __ret = __p0 + __p1 * __p2;
  17618   return __ret;
  17619 }
  17620 #else
  17621 __ai __attribute__((target("neon"))) int16x4_t vmla_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  17622   int16x4_t __ret;
  17623   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17624   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17625   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  17626   __ret = __rev0 + __rev1 * __rev2;
  17627   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17628   return __ret;
  17629 }
  17630 #endif
  17631 
  /* vmlaq_lane_u32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splatq_lane_u32(v, lane). a and b are uint32x4_t, v is
   * uint32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmlaq_lane_u32(__p0_54, __p1_54, __p2_54, __p3_54) __extension__ ({ \
    uint32x4_t __s0_54 = __p0_54; \
    uint32x4_t __s1_54 = __p1_54; \
    uint32x2_t __s2_54 = __p2_54; \
    uint32x4_t __ret_54 = __s0_54 + __s1_54 * splatq_lane_u32(__s2_54, __p3_54); \
    __ret_54; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmlaq_lane_u32(__p0_55, __p1_55, __p2_55, __p3_55) __extension__ ({ \
    uint32x4_t __s0_55 = __p0_55; \
    uint32x4_t __s1_55 = __p1_55; \
    uint32x2_t __s2_55 = __p2_55; \
    uint32x4_t __rev0_55 = __builtin_shufflevector(__s0_55, __s0_55, 3, 2, 1, 0); \
    uint32x4_t __rev1_55 = __builtin_shufflevector(__s1_55, __s1_55, 3, 2, 1, 0); \
    uint32x2_t __rev2_55 = __builtin_shufflevector(__s2_55, __s2_55, 1, 0); \
    uint32x4_t __ret_55 = __rev0_55 + __rev1_55 * __noswap_splatq_lane_u32(__rev2_55, __p3_55); \
    __ret_55 = __builtin_shufflevector(__ret_55, __ret_55, 3, 2, 1, 0); \
    __ret_55; \
  })
  #endif
  17655 
  /* vmlaq_lane_u16(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splatq_lane_u16(v, lane). a and b are uint16x8_t, v is
   * uint16x4_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmlaq_lane_u16(__p0_56, __p1_56, __p2_56, __p3_56) __extension__ ({ \
    uint16x8_t __s0_56 = __p0_56; \
    uint16x8_t __s1_56 = __p1_56; \
    uint16x4_t __s2_56 = __p2_56; \
    uint16x8_t __ret_56 = __s0_56 + __s1_56 * splatq_lane_u16(__s2_56, __p3_56); \
    __ret_56; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmlaq_lane_u16(__p0_57, __p1_57, __p2_57, __p3_57) __extension__ ({ \
    uint16x8_t __s0_57 = __p0_57; \
    uint16x8_t __s1_57 = __p1_57; \
    uint16x4_t __s2_57 = __p2_57; \
    uint16x8_t __rev0_57 = __builtin_shufflevector(__s0_57, __s0_57, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint16x8_t __rev1_57 = __builtin_shufflevector(__s1_57, __s1_57, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint16x4_t __rev2_57 = __builtin_shufflevector(__s2_57, __s2_57, 3, 2, 1, 0); \
    uint16x8_t __ret_57 = __rev0_57 + __rev1_57 * __noswap_splatq_lane_u16(__rev2_57, __p3_57); \
    __ret_57 = __builtin_shufflevector(__ret_57, __ret_57, 7, 6, 5, 4, 3, 2, 1, 0); \
    __ret_57; \
  })
  #endif
  17679 
  /* vmlaq_lane_f32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splatq_lane_f32(v, lane). a and b are float32x4_t, v is
   * float32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmlaq_lane_f32(__p0_58, __p1_58, __p2_58, __p3_58) __extension__ ({ \
    float32x4_t __s0_58 = __p0_58; \
    float32x4_t __s1_58 = __p1_58; \
    float32x2_t __s2_58 = __p2_58; \
    float32x4_t __ret_58 = __s0_58 + __s1_58 * splatq_lane_f32(__s2_58, __p3_58); \
    __ret_58; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmlaq_lane_f32(__p0_59, __p1_59, __p2_59, __p3_59) __extension__ ({ \
    float32x4_t __s0_59 = __p0_59; \
    float32x4_t __s1_59 = __p1_59; \
    float32x2_t __s2_59 = __p2_59; \
    float32x4_t __rev0_59 = __builtin_shufflevector(__s0_59, __s0_59, 3, 2, 1, 0); \
    float32x4_t __rev1_59 = __builtin_shufflevector(__s1_59, __s1_59, 3, 2, 1, 0); \
    float32x2_t __rev2_59 = __builtin_shufflevector(__s2_59, __s2_59, 1, 0); \
    float32x4_t __ret_59 = __rev0_59 + __rev1_59 * __noswap_splatq_lane_f32(__rev2_59, __p3_59); \
    __ret_59 = __builtin_shufflevector(__ret_59, __ret_59, 3, 2, 1, 0); \
    __ret_59; \
  })
  #endif
  17703 
  /* vmlaq_lane_s32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splatq_lane_s32(v, lane). a and b are int32x4_t, v is
   * int32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmlaq_lane_s32(__p0_60, __p1_60, __p2_60, __p3_60) __extension__ ({ \
    int32x4_t __s0_60 = __p0_60; \
    int32x4_t __s1_60 = __p1_60; \
    int32x2_t __s2_60 = __p2_60; \
    int32x4_t __ret_60 = __s0_60 + __s1_60 * splatq_lane_s32(__s2_60, __p3_60); \
    __ret_60; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmlaq_lane_s32(__p0_61, __p1_61, __p2_61, __p3_61) __extension__ ({ \
    int32x4_t __s0_61 = __p0_61; \
    int32x4_t __s1_61 = __p1_61; \
    int32x2_t __s2_61 = __p2_61; \
    int32x4_t __rev0_61 = __builtin_shufflevector(__s0_61, __s0_61, 3, 2, 1, 0); \
    int32x4_t __rev1_61 = __builtin_shufflevector(__s1_61, __s1_61, 3, 2, 1, 0); \
    int32x2_t __rev2_61 = __builtin_shufflevector(__s2_61, __s2_61, 1, 0); \
    int32x4_t __ret_61 = __rev0_61 + __rev1_61 * __noswap_splatq_lane_s32(__rev2_61, __p3_61); \
    __ret_61 = __builtin_shufflevector(__ret_61, __ret_61, 3, 2, 1, 0); \
    __ret_61; \
  })
  #endif
  17727 
  /* vmlaq_lane_s16(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splatq_lane_s16(v, lane). a and b are int16x8_t, v is
   * int16x4_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmlaq_lane_s16(__p0_62, __p1_62, __p2_62, __p3_62) __extension__ ({ \
    int16x8_t __s0_62 = __p0_62; \
    int16x8_t __s1_62 = __p1_62; \
    int16x4_t __s2_62 = __p2_62; \
    int16x8_t __ret_62 = __s0_62 + __s1_62 * splatq_lane_s16(__s2_62, __p3_62); \
    __ret_62; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmlaq_lane_s16(__p0_63, __p1_63, __p2_63, __p3_63) __extension__ ({ \
    int16x8_t __s0_63 = __p0_63; \
    int16x8_t __s1_63 = __p1_63; \
    int16x4_t __s2_63 = __p2_63; \
    int16x8_t __rev0_63 = __builtin_shufflevector(__s0_63, __s0_63, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __rev1_63 = __builtin_shufflevector(__s1_63, __s1_63, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x4_t __rev2_63 = __builtin_shufflevector(__s2_63, __s2_63, 3, 2, 1, 0); \
    int16x8_t __ret_63 = __rev0_63 + __rev1_63 * __noswap_splatq_lane_s16(__rev2_63, __p3_63); \
    __ret_63 = __builtin_shufflevector(__ret_63, __ret_63, 7, 6, 5, 4, 3, 2, 1, 0); \
    __ret_63; \
  })
  #endif
  17751 
  /* vmla_lane_u32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splat_lane_u32(v, lane). All three vector operands are
   * uint32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmla_lane_u32(__p0_64, __p1_64, __p2_64, __p3_64) __extension__ ({ \
    uint32x2_t __s0_64 = __p0_64; \
    uint32x2_t __s1_64 = __p1_64; \
    uint32x2_t __s2_64 = __p2_64; \
    uint32x2_t __ret_64 = __s0_64 + __s1_64 * splat_lane_u32(__s2_64, __p3_64); \
    __ret_64; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmla_lane_u32(__p0_65, __p1_65, __p2_65, __p3_65) __extension__ ({ \
    uint32x2_t __s0_65 = __p0_65; \
    uint32x2_t __s1_65 = __p1_65; \
    uint32x2_t __s2_65 = __p2_65; \
    uint32x2_t __rev0_65 = __builtin_shufflevector(__s0_65, __s0_65, 1, 0); \
    uint32x2_t __rev1_65 = __builtin_shufflevector(__s1_65, __s1_65, 1, 0); \
    uint32x2_t __rev2_65 = __builtin_shufflevector(__s2_65, __s2_65, 1, 0); \
    uint32x2_t __ret_65 = __rev0_65 + __rev1_65 * __noswap_splat_lane_u32(__rev2_65, __p3_65); \
    __ret_65 = __builtin_shufflevector(__ret_65, __ret_65, 1, 0); \
    __ret_65; \
  })
  #endif
  17775 
  /* vmla_lane_u16(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splat_lane_u16(v, lane). All three vector operands are
   * uint16x4_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmla_lane_u16(__p0_66, __p1_66, __p2_66, __p3_66) __extension__ ({ \
    uint16x4_t __s0_66 = __p0_66; \
    uint16x4_t __s1_66 = __p1_66; \
    uint16x4_t __s2_66 = __p2_66; \
    uint16x4_t __ret_66 = __s0_66 + __s1_66 * splat_lane_u16(__s2_66, __p3_66); \
    __ret_66; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmla_lane_u16(__p0_67, __p1_67, __p2_67, __p3_67) __extension__ ({ \
    uint16x4_t __s0_67 = __p0_67; \
    uint16x4_t __s1_67 = __p1_67; \
    uint16x4_t __s2_67 = __p2_67; \
    uint16x4_t __rev0_67 = __builtin_shufflevector(__s0_67, __s0_67, 3, 2, 1, 0); \
    uint16x4_t __rev1_67 = __builtin_shufflevector(__s1_67, __s1_67, 3, 2, 1, 0); \
    uint16x4_t __rev2_67 = __builtin_shufflevector(__s2_67, __s2_67, 3, 2, 1, 0); \
    uint16x4_t __ret_67 = __rev0_67 + __rev1_67 * __noswap_splat_lane_u16(__rev2_67, __p3_67); \
    __ret_67 = __builtin_shufflevector(__ret_67, __ret_67, 3, 2, 1, 0); \
    __ret_67; \
  })
  #endif
  17799 
  /* vmla_lane_f32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splat_lane_f32(v, lane). All three vector operands are
   * float32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmla_lane_f32(__p0_68, __p1_68, __p2_68, __p3_68) __extension__ ({ \
    float32x2_t __s0_68 = __p0_68; \
    float32x2_t __s1_68 = __p1_68; \
    float32x2_t __s2_68 = __p2_68; \
    float32x2_t __ret_68 = __s0_68 + __s1_68 * splat_lane_f32(__s2_68, __p3_68); \
    __ret_68; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmla_lane_f32(__p0_69, __p1_69, __p2_69, __p3_69) __extension__ ({ \
    float32x2_t __s0_69 = __p0_69; \
    float32x2_t __s1_69 = __p1_69; \
    float32x2_t __s2_69 = __p2_69; \
    float32x2_t __rev0_69 = __builtin_shufflevector(__s0_69, __s0_69, 1, 0); \
    float32x2_t __rev1_69 = __builtin_shufflevector(__s1_69, __s1_69, 1, 0); \
    float32x2_t __rev2_69 = __builtin_shufflevector(__s2_69, __s2_69, 1, 0); \
    float32x2_t __ret_69 = __rev0_69 + __rev1_69 * __noswap_splat_lane_f32(__rev2_69, __p3_69); \
    __ret_69 = __builtin_shufflevector(__ret_69, __ret_69, 1, 0); \
    __ret_69; \
  })
  #endif
  17823 
  /* vmla_lane_s32(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splat_lane_s32(v, lane). All three vector operands are
   * int32x2_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmla_lane_s32(__p0_70, __p1_70, __p2_70, __p3_70) __extension__ ({ \
    int32x2_t __s0_70 = __p0_70; \
    int32x2_t __s1_70 = __p1_70; \
    int32x2_t __s2_70 = __p2_70; \
    int32x2_t __ret_70 = __s0_70 + __s1_70 * splat_lane_s32(__s2_70, __p3_70); \
    __ret_70; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmla_lane_s32(__p0_71, __p1_71, __p2_71, __p3_71) __extension__ ({ \
    int32x2_t __s0_71 = __p0_71; \
    int32x2_t __s1_71 = __p1_71; \
    int32x2_t __s2_71 = __p2_71; \
    int32x2_t __rev0_71 = __builtin_shufflevector(__s0_71, __s0_71, 1, 0); \
    int32x2_t __rev1_71 = __builtin_shufflevector(__s1_71, __s1_71, 1, 0); \
    int32x2_t __rev2_71 = __builtin_shufflevector(__s2_71, __s2_71, 1, 0); \
    int32x2_t __ret_71 = __rev0_71 + __rev1_71 * __noswap_splat_lane_s32(__rev2_71, __p3_71); \
    __ret_71 = __builtin_shufflevector(__ret_71, __ret_71, 1, 0); \
    __ret_71; \
  })
  #endif
  17847 
  /* vmla_lane_s16(a, b, v, lane): statement-expression macro that evaluates
   * to a + b * splat_lane_s16(v, lane). All three vector operands are
   * int16x4_t; each is copied into a typed local before use. */
  #ifdef __LITTLE_ENDIAN__
  #define vmla_lane_s16(__p0_72, __p1_72, __p2_72, __p3_72) __extension__ ({ \
    int16x4_t __s0_72 = __p0_72; \
    int16x4_t __s1_72 = __p1_72; \
    int16x4_t __s2_72 = __p2_72; \
    int16x4_t __ret_72 = __s0_72 + __s1_72 * splat_lane_s16(__s2_72, __p3_72); \
    __ret_72; \
  })
  #else
  /* Big-endian build: the three vector operands are lane-reversed, the
   * __noswap_ splat helper is applied to the reversed lane vector, and the
   * result is lane-reversed again before being yielded. */
  #define vmla_lane_s16(__p0_73, __p1_73, __p2_73, __p3_73) __extension__ ({ \
    int16x4_t __s0_73 = __p0_73; \
    int16x4_t __s1_73 = __p1_73; \
    int16x4_t __s2_73 = __p2_73; \
    int16x4_t __rev0_73 = __builtin_shufflevector(__s0_73, __s0_73, 3, 2, 1, 0); \
    int16x4_t __rev1_73 = __builtin_shufflevector(__s1_73, __s1_73, 3, 2, 1, 0); \
    int16x4_t __rev2_73 = __builtin_shufflevector(__s2_73, __s2_73, 3, 2, 1, 0); \
    int16x4_t __ret_73 = __rev0_73 + __rev1_73 * __noswap_splat_lane_s16(__rev2_73, __p3_73); \
    __ret_73 = __builtin_shufflevector(__ret_73, __ret_73, 3, 2, 1, 0); \
    __ret_73; \
  })
  #endif
  17871 
  17872 #ifdef __LITTLE_ENDIAN__
  17873 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) {
  17874   uint32x4_t __ret;
  17875   __ret = __p0 + __p1 * (uint32x4_t) {__p2, __p2, __p2, __p2};
  17876   return __ret;
  17877 }
  17878 #else
  17879 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) {
  17880   uint32x4_t __ret;
  17881   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17882   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17883   __ret = __rev0 + __rev1 * (uint32x4_t) {__p2, __p2, __p2, __p2};
  17884   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17885   return __ret;
  17886 }
  17887 #endif
  17888 
  17889 #ifdef __LITTLE_ENDIAN__
  17890 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) {
  17891   uint16x8_t __ret;
  17892   __ret = __p0 + __p1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  17893   return __ret;
  17894 }
  17895 #else
  17896 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) {
  17897   uint16x8_t __ret;
  17898   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17899   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17900   __ret = __rev0 + __rev1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  17901   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17902   return __ret;
  17903 }
  17904 #endif
  17905 
  17906 #ifdef __LITTLE_ENDIAN__
  17907 __ai __attribute__((target("neon"))) float32x4_t vmlaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  17908   float32x4_t __ret;
  17909   __ret = __p0 + __p1 * (float32x4_t) {__p2, __p2, __p2, __p2};
  17910   return __ret;
  17911 }
  17912 #else
  17913 __ai __attribute__((target("neon"))) float32x4_t vmlaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  17914   float32x4_t __ret;
  17915   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17916   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17917   __ret = __rev0 + __rev1 * (float32x4_t) {__p2, __p2, __p2, __p2};
  17918   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17919   return __ret;
  17920 }
  17921 #endif
  17922 
  17923 #ifdef __LITTLE_ENDIAN__
  17924 __ai __attribute__((target("neon"))) int32x4_t vmlaq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) {
  17925   int32x4_t __ret;
  17926   __ret = __p0 + __p1 * (int32x4_t) {__p2, __p2, __p2, __p2};
  17927   return __ret;
  17928 }
  17929 #else
  17930 __ai __attribute__((target("neon"))) int32x4_t vmlaq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) {
  17931   int32x4_t __ret;
  17932   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17933   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17934   __ret = __rev0 + __rev1 * (int32x4_t) {__p2, __p2, __p2, __p2};
  17935   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17936   return __ret;
  17937 }
  17938 #endif
  17939 
  17940 #ifdef __LITTLE_ENDIAN__
  17941 __ai __attribute__((target("neon"))) int16x8_t vmlaq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) {
  17942   int16x8_t __ret;
  17943   __ret = __p0 + __p1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  17944   return __ret;
  17945 }
  17946 #else
  17947 __ai __attribute__((target("neon"))) int16x8_t vmlaq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) {
  17948   int16x8_t __ret;
  17949   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  17950   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  17951   __ret = __rev0 + __rev1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  17952   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  17953   return __ret;
  17954 }
  17955 #endif
  17956 
  17957 #ifdef __LITTLE_ENDIAN__
  17958 __ai __attribute__((target("neon"))) uint32x2_t vmla_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  17959   uint32x2_t __ret;
  17960   __ret = __p0 + __p1 * (uint32x2_t) {__p2, __p2};
  17961   return __ret;
  17962 }
  17963 #else
  17964 __ai __attribute__((target("neon"))) uint32x2_t vmla_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  17965   uint32x2_t __ret;
  17966   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  17967   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  17968   __ret = __rev0 + __rev1 * (uint32x2_t) {__p2, __p2};
  17969   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  17970   return __ret;
  17971 }
  17972 #endif
  17973 
  17974 #ifdef __LITTLE_ENDIAN__
  17975 __ai __attribute__((target("neon"))) uint16x4_t vmla_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  17976   uint16x4_t __ret;
  17977   __ret = __p0 + __p1 * (uint16x4_t) {__p2, __p2, __p2, __p2};
  17978   return __ret;
  17979 }
  17980 #else
  17981 __ai __attribute__((target("neon"))) uint16x4_t vmla_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  17982   uint16x4_t __ret;
  17983   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  17984   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  17985   __ret = __rev0 + __rev1 * (uint16x4_t) {__p2, __p2, __p2, __p2};
  17986   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  17987   return __ret;
  17988 }
  17989 #endif
  17990 
  17991 #ifdef __LITTLE_ENDIAN__
  17992 __ai __attribute__((target("neon"))) float32x2_t vmla_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  17993   float32x2_t __ret;
  17994   __ret = __p0 + __p1 * (float32x2_t) {__p2, __p2};
  17995   return __ret;
  17996 }
  17997 #else
  17998 __ai __attribute__((target("neon"))) float32x2_t vmla_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  17999   float32x2_t __ret;
  18000   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18001   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18002   __ret = __rev0 + __rev1 * (float32x2_t) {__p2, __p2};
  18003   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18004   return __ret;
  18005 }
  18006 #endif
  18007 
  18008 #ifdef __LITTLE_ENDIAN__
  18009 __ai __attribute__((target("neon"))) int32x2_t vmla_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) {
  18010   int32x2_t __ret;
  18011   __ret = __p0 + __p1 * (int32x2_t) {__p2, __p2};
  18012   return __ret;
  18013 }
  18014 #else
  18015 __ai __attribute__((target("neon"))) int32x2_t vmla_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) {
  18016   int32x2_t __ret;
  18017   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18018   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18019   __ret = __rev0 + __rev1 * (int32x2_t) {__p2, __p2};
  18020   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18021   return __ret;
  18022 }
  18023 #endif
  18024 
  18025 #ifdef __LITTLE_ENDIAN__
  18026 __ai __attribute__((target("neon"))) int16x4_t vmla_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) {
  18027   int16x4_t __ret;
  18028   __ret = __p0 + __p1 * (int16x4_t) {__p2, __p2, __p2, __p2};
  18029   return __ret;
  18030 }
  18031 #else
  18032 __ai __attribute__((target("neon"))) int16x4_t vmla_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) {
  18033   int16x4_t __ret;
  18034   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18035   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18036   __ret = __rev0 + __rev1 * (int16x4_t) {__p2, __p2, __p2, __p2};
  18037   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18038   return __ret;
  18039 }
  18040 #endif
  18041 
  18042 #ifdef __LITTLE_ENDIAN__
  18043 __ai __attribute__((target("neon"))) uint8x16_t vmlsq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  18044   uint8x16_t __ret;
  18045   __ret = __p0 - __p1 * __p2;
  18046   return __ret;
  18047 }
  18048 #else
  18049 __ai __attribute__((target("neon"))) uint8x16_t vmlsq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  18050   uint8x16_t __ret;
  18051   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18052   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18053   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18054   __ret = __rev0 - __rev1 * __rev2;
  18055   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18056   return __ret;
  18057 }
  18058 #endif
  18059 
  18060 #ifdef __LITTLE_ENDIAN__
  18061 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  18062   uint32x4_t __ret;
  18063   __ret = __p0 - __p1 * __p2;
  18064   return __ret;
  18065 }
  18066 #else
  18067 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  18068   uint32x4_t __ret;
  18069   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18070   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18071   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  18072   __ret = __rev0 - __rev1 * __rev2;
  18073   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18074   return __ret;
  18075 }
  18076 #endif
  18077 
  18078 #ifdef __LITTLE_ENDIAN__
  18079 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  18080   uint16x8_t __ret;
  18081   __ret = __p0 - __p1 * __p2;
  18082   return __ret;
  18083 }
  18084 #else
  18085 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  18086   uint16x8_t __ret;
  18087   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18088   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18089   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  18090   __ret = __rev0 - __rev1 * __rev2;
  18091   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18092   return __ret;
  18093 }
  18094 #endif
  18095 
  18096 #ifdef __LITTLE_ENDIAN__
  18097 __ai __attribute__((target("neon"))) int8x16_t vmlsq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  18098   int8x16_t __ret;
  18099   __ret = __p0 - __p1 * __p2;
  18100   return __ret;
  18101 }
  18102 #else
  18103 __ai __attribute__((target("neon"))) int8x16_t vmlsq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  18104   int8x16_t __ret;
  18105   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18106   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18107   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18108   __ret = __rev0 - __rev1 * __rev2;
  18109   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18110   return __ret;
  18111 }
  18112 #endif
  18113 
  18114 #ifdef __LITTLE_ENDIAN__
  18115 __ai __attribute__((target("neon"))) float32x4_t vmlsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  18116   float32x4_t __ret;
  18117   __ret = __p0 - __p1 * __p2;
  18118   return __ret;
  18119 }
  18120 #else
  18121 __ai __attribute__((target("neon"))) float32x4_t vmlsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  18122   float32x4_t __ret;
  18123   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18124   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18125   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  18126   __ret = __rev0 - __rev1 * __rev2;
  18127   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18128   return __ret;
  18129 }
  18130 #endif
  18131 
  18132 #ifdef __LITTLE_ENDIAN__
  18133 __ai __attribute__((target("neon"))) int32x4_t vmlsq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  18134   int32x4_t __ret;
  18135   __ret = __p0 - __p1 * __p2;
  18136   return __ret;
  18137 }
  18138 #else
  18139 __ai __attribute__((target("neon"))) int32x4_t vmlsq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  18140   int32x4_t __ret;
  18141   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18142   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18143   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  18144   __ret = __rev0 - __rev1 * __rev2;
  18145   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18146   return __ret;
  18147 }
  18148 #endif
  18149 
  18150 #ifdef __LITTLE_ENDIAN__
  18151 __ai __attribute__((target("neon"))) int16x8_t vmlsq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  18152   int16x8_t __ret;
  18153   __ret = __p0 - __p1 * __p2;
  18154   return __ret;
  18155 }
  18156 #else
  18157 __ai __attribute__((target("neon"))) int16x8_t vmlsq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  18158   int16x8_t __ret;
  18159   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18160   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18161   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  18162   __ret = __rev0 - __rev1 * __rev2;
  18163   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18164   return __ret;
  18165 }
  18166 #endif
  18167 
  18168 #ifdef __LITTLE_ENDIAN__
  18169 __ai __attribute__((target("neon"))) uint8x8_t vmls_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  18170   uint8x8_t __ret;
  18171   __ret = __p0 - __p1 * __p2;
  18172   return __ret;
  18173 }
  18174 #else
  18175 __ai __attribute__((target("neon"))) uint8x8_t vmls_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  18176   uint8x8_t __ret;
  18177   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18178   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18179   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  18180   __ret = __rev0 - __rev1 * __rev2;
  18181   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18182   return __ret;
  18183 }
  18184 #endif
  18185 
  18186 #ifdef __LITTLE_ENDIAN__
  18187 __ai __attribute__((target("neon"))) uint32x2_t vmls_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  18188   uint32x2_t __ret;
  18189   __ret = __p0 - __p1 * __p2;
  18190   return __ret;
  18191 }
  18192 #else
  18193 __ai __attribute__((target("neon"))) uint32x2_t vmls_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  18194   uint32x2_t __ret;
  18195   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18196   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18197   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  18198   __ret = __rev0 - __rev1 * __rev2;
  18199   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18200   return __ret;
  18201 }
  18202 #endif
  18203 
  18204 #ifdef __LITTLE_ENDIAN__
  18205 __ai __attribute__((target("neon"))) uint16x4_t vmls_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  18206   uint16x4_t __ret;
  18207   __ret = __p0 - __p1 * __p2;
  18208   return __ret;
  18209 }
  18210 #else
  18211 __ai __attribute__((target("neon"))) uint16x4_t vmls_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  18212   uint16x4_t __ret;
  18213   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18214   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18215   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  18216   __ret = __rev0 - __rev1 * __rev2;
  18217   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18218   return __ret;
  18219 }
  18220 #endif
  18221 
  18222 #ifdef __LITTLE_ENDIAN__
  18223 __ai __attribute__((target("neon"))) int8x8_t vmls_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  18224   int8x8_t __ret;
  18225   __ret = __p0 - __p1 * __p2;
  18226   return __ret;
  18227 }
  18228 #else
  18229 __ai __attribute__((target("neon"))) int8x8_t vmls_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  18230   int8x8_t __ret;
  18231   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18232   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18233   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  18234   __ret = __rev0 - __rev1 * __rev2;
  18235   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18236   return __ret;
  18237 }
  18238 #endif
  18239 
  18240 #ifdef __LITTLE_ENDIAN__
  18241 __ai __attribute__((target("neon"))) float32x2_t vmls_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  18242   float32x2_t __ret;
  18243   __ret = __p0 - __p1 * __p2;
  18244   return __ret;
  18245 }
  18246 #else
  18247 __ai __attribute__((target("neon"))) float32x2_t vmls_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  18248   float32x2_t __ret;
  18249   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18250   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18251   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  18252   __ret = __rev0 - __rev1 * __rev2;
  18253   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18254   return __ret;
  18255 }
  18256 #endif
  18257 
  18258 #ifdef __LITTLE_ENDIAN__
  18259 __ai __attribute__((target("neon"))) int32x2_t vmls_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  18260   int32x2_t __ret;
  18261   __ret = __p0 - __p1 * __p2;
  18262   return __ret;
  18263 }
  18264 #else
  18265 __ai __attribute__((target("neon"))) int32x2_t vmls_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  18266   int32x2_t __ret;
  18267   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18268   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18269   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  18270   __ret = __rev0 - __rev1 * __rev2;
  18271   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18272   return __ret;
  18273 }
  18274 #endif
  18275 
  18276 #ifdef __LITTLE_ENDIAN__
  18277 __ai __attribute__((target("neon"))) int16x4_t vmls_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  18278   int16x4_t __ret;
  18279   __ret = __p0 - __p1 * __p2;
  18280   return __ret;
  18281 }
  18282 #else
  18283 __ai __attribute__((target("neon"))) int16x4_t vmls_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  18284   int16x4_t __ret;
  18285   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18286   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18287   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  18288   __ret = __rev0 - __rev1 * __rev2;
  18289   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18290   return __ret;
  18291 }
  18292 #endif
  18293 
  18294 #ifdef __LITTLE_ENDIAN__
  18295 #define vmlsq_lane_u32(__p0_74, __p1_74, __p2_74, __p3_74) __extension__ ({ \
  18296   uint32x4_t __ret_74; \
  18297   uint32x4_t __s0_74 = __p0_74; \
  18298   uint32x4_t __s1_74 = __p1_74; \
  18299   uint32x2_t __s2_74 = __p2_74; \
  18300   __ret_74 = __s0_74 - __s1_74 * splatq_lane_u32(__s2_74, __p3_74); \
  18301   __ret_74; \
  18302 })
  18303 #else
  18304 #define vmlsq_lane_u32(__p0_75, __p1_75, __p2_75, __p3_75) __extension__ ({ \
  18305   uint32x4_t __ret_75; \
  18306   uint32x4_t __s0_75 = __p0_75; \
  18307   uint32x4_t __s1_75 = __p1_75; \
  18308   uint32x2_t __s2_75 = __p2_75; \
  18309   uint32x4_t __rev0_75;  __rev0_75 = __builtin_shufflevector(__s0_75, __s0_75, 3, 2, 1, 0); \
  18310   uint32x4_t __rev1_75;  __rev1_75 = __builtin_shufflevector(__s1_75, __s1_75, 3, 2, 1, 0); \
  18311   uint32x2_t __rev2_75;  __rev2_75 = __builtin_shufflevector(__s2_75, __s2_75, 1, 0); \
  18312   __ret_75 = __rev0_75 - __rev1_75 * __noswap_splatq_lane_u32(__rev2_75, __p3_75); \
  18313   __ret_75 = __builtin_shufflevector(__ret_75, __ret_75, 3, 2, 1, 0); \
  18314   __ret_75; \
  18315 })
  18316 #endif
  18317 
  18318 #ifdef __LITTLE_ENDIAN__
  18319 #define vmlsq_lane_u16(__p0_76, __p1_76, __p2_76, __p3_76) __extension__ ({ \
  18320   uint16x8_t __ret_76; \
  18321   uint16x8_t __s0_76 = __p0_76; \
  18322   uint16x8_t __s1_76 = __p1_76; \
  18323   uint16x4_t __s2_76 = __p2_76; \
  18324   __ret_76 = __s0_76 - __s1_76 * splatq_lane_u16(__s2_76, __p3_76); \
  18325   __ret_76; \
  18326 })
  18327 #else
  18328 #define vmlsq_lane_u16(__p0_77, __p1_77, __p2_77, __p3_77) __extension__ ({ \
  18329   uint16x8_t __ret_77; \
  18330   uint16x8_t __s0_77 = __p0_77; \
  18331   uint16x8_t __s1_77 = __p1_77; \
  18332   uint16x4_t __s2_77 = __p2_77; \
  18333   uint16x8_t __rev0_77;  __rev0_77 = __builtin_shufflevector(__s0_77, __s0_77, 7, 6, 5, 4, 3, 2, 1, 0); \
  18334   uint16x8_t __rev1_77;  __rev1_77 = __builtin_shufflevector(__s1_77, __s1_77, 7, 6, 5, 4, 3, 2, 1, 0); \
  18335   uint16x4_t __rev2_77;  __rev2_77 = __builtin_shufflevector(__s2_77, __s2_77, 3, 2, 1, 0); \
  18336   __ret_77 = __rev0_77 - __rev1_77 * __noswap_splatq_lane_u16(__rev2_77, __p3_77); \
  18337   __ret_77 = __builtin_shufflevector(__ret_77, __ret_77, 7, 6, 5, 4, 3, 2, 1, 0); \
  18338   __ret_77; \
  18339 })
  18340 #endif
  18341 
  18342 #ifdef __LITTLE_ENDIAN__
  18343 #define vmlsq_lane_f32(__p0_78, __p1_78, __p2_78, __p3_78) __extension__ ({ \
  18344   float32x4_t __ret_78; \
  18345   float32x4_t __s0_78 = __p0_78; \
  18346   float32x4_t __s1_78 = __p1_78; \
  18347   float32x2_t __s2_78 = __p2_78; \
  18348   __ret_78 = __s0_78 - __s1_78 * splatq_lane_f32(__s2_78, __p3_78); \
  18349   __ret_78; \
  18350 })
  18351 #else
  18352 #define vmlsq_lane_f32(__p0_79, __p1_79, __p2_79, __p3_79) __extension__ ({ \
  18353   float32x4_t __ret_79; \
  18354   float32x4_t __s0_79 = __p0_79; \
  18355   float32x4_t __s1_79 = __p1_79; \
  18356   float32x2_t __s2_79 = __p2_79; \
  18357   float32x4_t __rev0_79;  __rev0_79 = __builtin_shufflevector(__s0_79, __s0_79, 3, 2, 1, 0); \
  18358   float32x4_t __rev1_79;  __rev1_79 = __builtin_shufflevector(__s1_79, __s1_79, 3, 2, 1, 0); \
  18359   float32x2_t __rev2_79;  __rev2_79 = __builtin_shufflevector(__s2_79, __s2_79, 1, 0); \
  18360   __ret_79 = __rev0_79 - __rev1_79 * __noswap_splatq_lane_f32(__rev2_79, __p3_79); \
  18361   __ret_79 = __builtin_shufflevector(__ret_79, __ret_79, 3, 2, 1, 0); \
  18362   __ret_79; \
  18363 })
  18364 #endif
  18365 
  18366 #ifdef __LITTLE_ENDIAN__
  18367 #define vmlsq_lane_s32(__p0_80, __p1_80, __p2_80, __p3_80) __extension__ ({ \
  18368   int32x4_t __ret_80; \
  18369   int32x4_t __s0_80 = __p0_80; \
  18370   int32x4_t __s1_80 = __p1_80; \
  18371   int32x2_t __s2_80 = __p2_80; \
  18372   __ret_80 = __s0_80 - __s1_80 * splatq_lane_s32(__s2_80, __p3_80); \
  18373   __ret_80; \
  18374 })
  18375 #else
  18376 #define vmlsq_lane_s32(__p0_81, __p1_81, __p2_81, __p3_81) __extension__ ({ \
  18377   int32x4_t __ret_81; \
  18378   int32x4_t __s0_81 = __p0_81; \
  18379   int32x4_t __s1_81 = __p1_81; \
  18380   int32x2_t __s2_81 = __p2_81; \
  18381   int32x4_t __rev0_81;  __rev0_81 = __builtin_shufflevector(__s0_81, __s0_81, 3, 2, 1, 0); \
  18382   int32x4_t __rev1_81;  __rev1_81 = __builtin_shufflevector(__s1_81, __s1_81, 3, 2, 1, 0); \
  18383   int32x2_t __rev2_81;  __rev2_81 = __builtin_shufflevector(__s2_81, __s2_81, 1, 0); \
  18384   __ret_81 = __rev0_81 - __rev1_81 * __noswap_splatq_lane_s32(__rev2_81, __p3_81); \
  18385   __ret_81 = __builtin_shufflevector(__ret_81, __ret_81, 3, 2, 1, 0); \
  18386   __ret_81; \
  18387 })
  18388 #endif
  18389 
  18390 #ifdef __LITTLE_ENDIAN__
  18391 #define vmlsq_lane_s16(__p0_82, __p1_82, __p2_82, __p3_82) __extension__ ({ \
  18392   int16x8_t __ret_82; \
  18393   int16x8_t __s0_82 = __p0_82; \
  18394   int16x8_t __s1_82 = __p1_82; \
  18395   int16x4_t __s2_82 = __p2_82; \
  18396   __ret_82 = __s0_82 - __s1_82 * splatq_lane_s16(__s2_82, __p3_82); \
  18397   __ret_82; \
  18398 })
  18399 #else
  18400 #define vmlsq_lane_s16(__p0_83, __p1_83, __p2_83, __p3_83) __extension__ ({ \
  18401   int16x8_t __ret_83; \
  18402   int16x8_t __s0_83 = __p0_83; \
  18403   int16x8_t __s1_83 = __p1_83; \
  18404   int16x4_t __s2_83 = __p2_83; \
  18405   int16x8_t __rev0_83;  __rev0_83 = __builtin_shufflevector(__s0_83, __s0_83, 7, 6, 5, 4, 3, 2, 1, 0); \
  18406   int16x8_t __rev1_83;  __rev1_83 = __builtin_shufflevector(__s1_83, __s1_83, 7, 6, 5, 4, 3, 2, 1, 0); \
  18407   int16x4_t __rev2_83;  __rev2_83 = __builtin_shufflevector(__s2_83, __s2_83, 3, 2, 1, 0); \
  18408   __ret_83 = __rev0_83 - __rev1_83 * __noswap_splatq_lane_s16(__rev2_83, __p3_83); \
  18409   __ret_83 = __builtin_shufflevector(__ret_83, __ret_83, 7, 6, 5, 4, 3, 2, 1, 0); \
  18410   __ret_83; \
  18411 })
  18412 #endif
  18413 
  18414 #ifdef __LITTLE_ENDIAN__
  18415 #define vmls_lane_u32(__p0_84, __p1_84, __p2_84, __p3_84) __extension__ ({ \
  18416   uint32x2_t __ret_84; \
  18417   uint32x2_t __s0_84 = __p0_84; \
  18418   uint32x2_t __s1_84 = __p1_84; \
  18419   uint32x2_t __s2_84 = __p2_84; \
  18420   __ret_84 = __s0_84 - __s1_84 * splat_lane_u32(__s2_84, __p3_84); \
  18421   __ret_84; \
  18422 })
  18423 #else
  18424 #define vmls_lane_u32(__p0_85, __p1_85, __p2_85, __p3_85) __extension__ ({ \
  18425   uint32x2_t __ret_85; \
  18426   uint32x2_t __s0_85 = __p0_85; \
  18427   uint32x2_t __s1_85 = __p1_85; \
  18428   uint32x2_t __s2_85 = __p2_85; \
  18429   uint32x2_t __rev0_85;  __rev0_85 = __builtin_shufflevector(__s0_85, __s0_85, 1, 0); \
  18430   uint32x2_t __rev1_85;  __rev1_85 = __builtin_shufflevector(__s1_85, __s1_85, 1, 0); \
  18431   uint32x2_t __rev2_85;  __rev2_85 = __builtin_shufflevector(__s2_85, __s2_85, 1, 0); \
  18432   __ret_85 = __rev0_85 - __rev1_85 * __noswap_splat_lane_u32(__rev2_85, __p3_85); \
  18433   __ret_85 = __builtin_shufflevector(__ret_85, __ret_85, 1, 0); \
  18434   __ret_85; \
  18435 })
  18436 #endif
  18437 
  18438 #ifdef __LITTLE_ENDIAN__
  18439 #define vmls_lane_u16(__p0_86, __p1_86, __p2_86, __p3_86) __extension__ ({ \
  18440   uint16x4_t __ret_86; \
  18441   uint16x4_t __s0_86 = __p0_86; \
  18442   uint16x4_t __s1_86 = __p1_86; \
  18443   uint16x4_t __s2_86 = __p2_86; \
  18444   __ret_86 = __s0_86 - __s1_86 * splat_lane_u16(__s2_86, __p3_86); \
  18445   __ret_86; \
  18446 })
  18447 #else
  18448 #define vmls_lane_u16(__p0_87, __p1_87, __p2_87, __p3_87) __extension__ ({ \
  18449   uint16x4_t __ret_87; \
  18450   uint16x4_t __s0_87 = __p0_87; \
  18451   uint16x4_t __s1_87 = __p1_87; \
  18452   uint16x4_t __s2_87 = __p2_87; \
  18453   uint16x4_t __rev0_87;  __rev0_87 = __builtin_shufflevector(__s0_87, __s0_87, 3, 2, 1, 0); \
  18454   uint16x4_t __rev1_87;  __rev1_87 = __builtin_shufflevector(__s1_87, __s1_87, 3, 2, 1, 0); \
  18455   uint16x4_t __rev2_87;  __rev2_87 = __builtin_shufflevector(__s2_87, __s2_87, 3, 2, 1, 0); \
  18456   __ret_87 = __rev0_87 - __rev1_87 * __noswap_splat_lane_u16(__rev2_87, __p3_87); \
  18457   __ret_87 = __builtin_shufflevector(__ret_87, __ret_87, 3, 2, 1, 0); \
  18458   __ret_87; \
  18459 })
  18460 #endif
  18461 
  18462 #ifdef __LITTLE_ENDIAN__
  18463 #define vmls_lane_f32(__p0_88, __p1_88, __p2_88, __p3_88) __extension__ ({ \
  18464   float32x2_t __ret_88; \
  18465   float32x2_t __s0_88 = __p0_88; \
  18466   float32x2_t __s1_88 = __p1_88; \
  18467   float32x2_t __s2_88 = __p2_88; \
  18468   __ret_88 = __s0_88 - __s1_88 * splat_lane_f32(__s2_88, __p3_88); \
  18469   __ret_88; \
  18470 })
  18471 #else
  18472 #define vmls_lane_f32(__p0_89, __p1_89, __p2_89, __p3_89) __extension__ ({ \
  18473   float32x2_t __ret_89; \
  18474   float32x2_t __s0_89 = __p0_89; \
  18475   float32x2_t __s1_89 = __p1_89; \
  18476   float32x2_t __s2_89 = __p2_89; \
  18477   float32x2_t __rev0_89;  __rev0_89 = __builtin_shufflevector(__s0_89, __s0_89, 1, 0); \
  18478   float32x2_t __rev1_89;  __rev1_89 = __builtin_shufflevector(__s1_89, __s1_89, 1, 0); \
  18479   float32x2_t __rev2_89;  __rev2_89 = __builtin_shufflevector(__s2_89, __s2_89, 1, 0); \
  18480   __ret_89 = __rev0_89 - __rev1_89 * __noswap_splat_lane_f32(__rev2_89, __p3_89); \
  18481   __ret_89 = __builtin_shufflevector(__ret_89, __ret_89, 1, 0); \
  18482   __ret_89; \
  18483 })
  18484 #endif
  18485 
  18486 #ifdef __LITTLE_ENDIAN__
  18487 #define vmls_lane_s32(__p0_90, __p1_90, __p2_90, __p3_90) __extension__ ({ \
  18488   int32x2_t __ret_90; \
  18489   int32x2_t __s0_90 = __p0_90; \
  18490   int32x2_t __s1_90 = __p1_90; \
  18491   int32x2_t __s2_90 = __p2_90; \
  18492   __ret_90 = __s0_90 - __s1_90 * splat_lane_s32(__s2_90, __p3_90); \
  18493   __ret_90; \
  18494 })
  18495 #else
  18496 #define vmls_lane_s32(__p0_91, __p1_91, __p2_91, __p3_91) __extension__ ({ \
  18497   int32x2_t __ret_91; \
  18498   int32x2_t __s0_91 = __p0_91; \
  18499   int32x2_t __s1_91 = __p1_91; \
  18500   int32x2_t __s2_91 = __p2_91; \
  18501   int32x2_t __rev0_91;  __rev0_91 = __builtin_shufflevector(__s0_91, __s0_91, 1, 0); \
  18502   int32x2_t __rev1_91;  __rev1_91 = __builtin_shufflevector(__s1_91, __s1_91, 1, 0); \
  18503   int32x2_t __rev2_91;  __rev2_91 = __builtin_shufflevector(__s2_91, __s2_91, 1, 0); \
  18504   __ret_91 = __rev0_91 - __rev1_91 * __noswap_splat_lane_s32(__rev2_91, __p3_91); \
  18505   __ret_91 = __builtin_shufflevector(__ret_91, __ret_91, 1, 0); \
  18506   __ret_91; \
  18507 })
  18508 #endif
  18509 
  18510 #ifdef __LITTLE_ENDIAN__
  18511 #define vmls_lane_s16(__p0_92, __p1_92, __p2_92, __p3_92) __extension__ ({ \
  18512   int16x4_t __ret_92; \
  18513   int16x4_t __s0_92 = __p0_92; \
  18514   int16x4_t __s1_92 = __p1_92; \
  18515   int16x4_t __s2_92 = __p2_92; \
  18516   __ret_92 = __s0_92 - __s1_92 * splat_lane_s16(__s2_92, __p3_92); \
  18517   __ret_92; \
  18518 })
  18519 #else
  18520 #define vmls_lane_s16(__p0_93, __p1_93, __p2_93, __p3_93) __extension__ ({ \
  18521   int16x4_t __ret_93; \
  18522   int16x4_t __s0_93 = __p0_93; \
  18523   int16x4_t __s1_93 = __p1_93; \
  18524   int16x4_t __s2_93 = __p2_93; \
  18525   int16x4_t __rev0_93;  __rev0_93 = __builtin_shufflevector(__s0_93, __s0_93, 3, 2, 1, 0); \
  18526   int16x4_t __rev1_93;  __rev1_93 = __builtin_shufflevector(__s1_93, __s1_93, 3, 2, 1, 0); \
  18527   int16x4_t __rev2_93;  __rev2_93 = __builtin_shufflevector(__s2_93, __s2_93, 3, 2, 1, 0); \
  18528   __ret_93 = __rev0_93 - __rev1_93 * __noswap_splat_lane_s16(__rev2_93, __p3_93); \
  18529   __ret_93 = __builtin_shufflevector(__ret_93, __ret_93, 3, 2, 1, 0); \
  18530   __ret_93; \
  18531 })
  18532 #endif
  18533 
  18534 #ifdef __LITTLE_ENDIAN__
  18535 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) {
  18536   uint32x4_t __ret;
  18537   __ret = __p0 - __p1 * (uint32x4_t) {__p2, __p2, __p2, __p2};
  18538   return __ret;
  18539 }
  18540 #else
  18541 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) {
  18542   uint32x4_t __ret;
  18543   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18544   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18545   __ret = __rev0 - __rev1 * (uint32x4_t) {__p2, __p2, __p2, __p2};
  18546   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18547   return __ret;
  18548 }
  18549 #endif
  18550 
  18551 #ifdef __LITTLE_ENDIAN__
  18552 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) {
  18553   uint16x8_t __ret;
  18554   __ret = __p0 - __p1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  18555   return __ret;
  18556 }
  18557 #else
  18558 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) {
  18559   uint16x8_t __ret;
  18560   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18561   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18562   __ret = __rev0 - __rev1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  18563   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18564   return __ret;
  18565 }
  18566 #endif
  18567 
  18568 #ifdef __LITTLE_ENDIAN__
  18569 __ai __attribute__((target("neon"))) float32x4_t vmlsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  18570   float32x4_t __ret;
  18571   __ret = __p0 - __p1 * (float32x4_t) {__p2, __p2, __p2, __p2};
  18572   return __ret;
  18573 }
  18574 #else
  18575 __ai __attribute__((target("neon"))) float32x4_t vmlsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  18576   float32x4_t __ret;
  18577   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18578   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18579   __ret = __rev0 - __rev1 * (float32x4_t) {__p2, __p2, __p2, __p2};
  18580   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18581   return __ret;
  18582 }
  18583 #endif
  18584 
  18585 #ifdef __LITTLE_ENDIAN__
  18586 __ai __attribute__((target("neon"))) int32x4_t vmlsq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) {
  18587   int32x4_t __ret;
  18588   __ret = __p0 - __p1 * (int32x4_t) {__p2, __p2, __p2, __p2};
  18589   return __ret;
  18590 }
  18591 #else
  18592 __ai __attribute__((target("neon"))) int32x4_t vmlsq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) {
  18593   int32x4_t __ret;
  18594   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18595   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18596   __ret = __rev0 - __rev1 * (int32x4_t) {__p2, __p2, __p2, __p2};
  18597   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18598   return __ret;
  18599 }
  18600 #endif
  18601 
  18602 #ifdef __LITTLE_ENDIAN__
  18603 __ai __attribute__((target("neon"))) int16x8_t vmlsq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) {
  18604   int16x8_t __ret;
  18605   __ret = __p0 - __p1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  18606   return __ret;
  18607 }
  18608 #else
  18609 __ai __attribute__((target("neon"))) int16x8_t vmlsq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) {
  18610   int16x8_t __ret;
  18611   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  18612   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  18613   __ret = __rev0 - __rev1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2};
  18614   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18615   return __ret;
  18616 }
  18617 #endif
  18618 
  18619 #ifdef __LITTLE_ENDIAN__
  18620 __ai __attribute__((target("neon"))) uint32x2_t vmls_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  18621   uint32x2_t __ret;
  18622   __ret = __p0 - __p1 * (uint32x2_t) {__p2, __p2};
  18623   return __ret;
  18624 }
  18625 #else
  18626 __ai __attribute__((target("neon"))) uint32x2_t vmls_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  18627   uint32x2_t __ret;
  18628   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18629   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18630   __ret = __rev0 - __rev1 * (uint32x2_t) {__p2, __p2};
  18631   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18632   return __ret;
  18633 }
  18634 #endif
  18635 
  18636 #ifdef __LITTLE_ENDIAN__
  18637 __ai __attribute__((target("neon"))) uint16x4_t vmls_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  18638   uint16x4_t __ret;
  18639   __ret = __p0 - __p1 * (uint16x4_t) {__p2, __p2, __p2, __p2};
  18640   return __ret;
  18641 }
  18642 #else
  18643 __ai __attribute__((target("neon"))) uint16x4_t vmls_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  18644   uint16x4_t __ret;
  18645   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18646   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18647   __ret = __rev0 - __rev1 * (uint16x4_t) {__p2, __p2, __p2, __p2};
  18648   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18649   return __ret;
  18650 }
  18651 #endif
  18652 
  18653 #ifdef __LITTLE_ENDIAN__
  18654 __ai __attribute__((target("neon"))) float32x2_t vmls_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  18655   float32x2_t __ret;
  18656   __ret = __p0 - __p1 * (float32x2_t) {__p2, __p2};
  18657   return __ret;
  18658 }
  18659 #else
  18660 __ai __attribute__((target("neon"))) float32x2_t vmls_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  18661   float32x2_t __ret;
  18662   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18663   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18664   __ret = __rev0 - __rev1 * (float32x2_t) {__p2, __p2};
  18665   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18666   return __ret;
  18667 }
  18668 #endif
  18669 
  18670 #ifdef __LITTLE_ENDIAN__
  18671 __ai __attribute__((target("neon"))) int32x2_t vmls_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) {
  18672   int32x2_t __ret;
  18673   __ret = __p0 - __p1 * (int32x2_t) {__p2, __p2};
  18674   return __ret;
  18675 }
  18676 #else
  18677 __ai __attribute__((target("neon"))) int32x2_t vmls_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) {
  18678   int32x2_t __ret;
  18679   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  18680   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  18681   __ret = __rev0 - __rev1 * (int32x2_t) {__p2, __p2};
  18682   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18683   return __ret;
  18684 }
  18685 #endif
  18686 
  18687 #ifdef __LITTLE_ENDIAN__
  18688 __ai __attribute__((target("neon"))) int16x4_t vmls_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) {
  18689   int16x4_t __ret;
  18690   __ret = __p0 - __p1 * (int16x4_t) {__p2, __p2, __p2, __p2};
  18691   return __ret;
  18692 }
  18693 #else
  18694 __ai __attribute__((target("neon"))) int16x4_t vmls_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) {
  18695   int16x4_t __ret;
  18696   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  18697   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  18698   __ret = __rev0 - __rev1 * (int16x4_t) {__p2, __p2, __p2, __p2};
  18699   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18700   return __ret;
  18701 }
  18702 #endif
  18703 
  18704 #ifdef __LITTLE_ENDIAN__
  18705 __ai __attribute__((target("neon"))) poly8x8_t vmov_n_p8(poly8_t __p0) {
  18706   poly8x8_t __ret;
  18707   __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18708   return __ret;
  18709 }
  18710 #else
  18711 __ai __attribute__((target("neon"))) poly8x8_t vmov_n_p8(poly8_t __p0) {
  18712   poly8x8_t __ret;
  18713   __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18714   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18715   return __ret;
  18716 }
  18717 #endif
  18718 
  18719 #ifdef __LITTLE_ENDIAN__
  18720 __ai __attribute__((target("neon"))) poly16x4_t vmov_n_p16(poly16_t __p0) {
  18721   poly16x4_t __ret;
  18722   __ret = (poly16x4_t) {__p0, __p0, __p0, __p0};
  18723   return __ret;
  18724 }
  18725 #else
  18726 __ai __attribute__((target("neon"))) poly16x4_t vmov_n_p16(poly16_t __p0) {
  18727   poly16x4_t __ret;
  18728   __ret = (poly16x4_t) {__p0, __p0, __p0, __p0};
  18729   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18730   return __ret;
  18731 }
  18732 #endif
  18733 
  18734 #ifdef __LITTLE_ENDIAN__
  18735 __ai __attribute__((target("neon"))) poly8x16_t vmovq_n_p8(poly8_t __p0) {
  18736   poly8x16_t __ret;
  18737   __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18738   return __ret;
  18739 }
  18740 #else
  18741 __ai __attribute__((target("neon"))) poly8x16_t vmovq_n_p8(poly8_t __p0) {
  18742   poly8x16_t __ret;
  18743   __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18744   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18745   return __ret;
  18746 }
  18747 #endif
  18748 
  18749 #ifdef __LITTLE_ENDIAN__
  18750 __ai __attribute__((target("neon"))) poly16x8_t vmovq_n_p16(poly16_t __p0) {
  18751   poly16x8_t __ret;
  18752   __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18753   return __ret;
  18754 }
  18755 #else
  18756 __ai __attribute__((target("neon"))) poly16x8_t vmovq_n_p16(poly16_t __p0) {
  18757   poly16x8_t __ret;
  18758   __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18759   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18760   return __ret;
  18761 }
  18762 #endif
  18763 
  18764 #ifdef __LITTLE_ENDIAN__
  18765 __ai __attribute__((target("neon"))) uint8x16_t vmovq_n_u8(uint8_t __p0) {
  18766   uint8x16_t __ret;
  18767   __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18768   return __ret;
  18769 }
  18770 #else
  18771 __ai __attribute__((target("neon"))) uint8x16_t vmovq_n_u8(uint8_t __p0) {
  18772   uint8x16_t __ret;
  18773   __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18774   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18775   return __ret;
  18776 }
  18777 #endif
  18778 
  18779 #ifdef __LITTLE_ENDIAN__
  18780 __ai __attribute__((target("neon"))) uint32x4_t vmovq_n_u32(uint32_t __p0) {
  18781   uint32x4_t __ret;
  18782   __ret = (uint32x4_t) {__p0, __p0, __p0, __p0};
  18783   return __ret;
  18784 }
  18785 #else
  18786 __ai __attribute__((target("neon"))) uint32x4_t vmovq_n_u32(uint32_t __p0) {
  18787   uint32x4_t __ret;
  18788   __ret = (uint32x4_t) {__p0, __p0, __p0, __p0};
  18789   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18790   return __ret;
  18791 }
  18792 #endif
  18793 
  18794 #ifdef __LITTLE_ENDIAN__
  18795 __ai __attribute__((target("neon"))) uint64x2_t vmovq_n_u64(uint64_t __p0) {
  18796   uint64x2_t __ret;
  18797   __ret = (uint64x2_t) {__p0, __p0};
  18798   return __ret;
  18799 }
  18800 #else
  18801 __ai __attribute__((target("neon"))) uint64x2_t vmovq_n_u64(uint64_t __p0) {
  18802   uint64x2_t __ret;
  18803   __ret = (uint64x2_t) {__p0, __p0};
  18804   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18805   return __ret;
  18806 }
  18807 #endif
  18808 
  18809 #ifdef __LITTLE_ENDIAN__
  18810 __ai __attribute__((target("neon"))) uint16x8_t vmovq_n_u16(uint16_t __p0) {
  18811   uint16x8_t __ret;
  18812   __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18813   return __ret;
  18814 }
  18815 #else
  18816 __ai __attribute__((target("neon"))) uint16x8_t vmovq_n_u16(uint16_t __p0) {
  18817   uint16x8_t __ret;
  18818   __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18819   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18820   return __ret;
  18821 }
  18822 #endif
  18823 
  18824 #ifdef __LITTLE_ENDIAN__
  18825 __ai __attribute__((target("neon"))) int8x16_t vmovq_n_s8(int8_t __p0) {
  18826   int8x16_t __ret;
  18827   __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18828   return __ret;
  18829 }
  18830 #else
  18831 __ai __attribute__((target("neon"))) int8x16_t vmovq_n_s8(int8_t __p0) {
  18832   int8x16_t __ret;
  18833   __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18834   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  18835   return __ret;
  18836 }
  18837 #endif
  18838 
  18839 #ifdef __LITTLE_ENDIAN__
  18840 __ai __attribute__((target("neon"))) float32x4_t vmovq_n_f32(float32_t __p0) {
  18841   float32x4_t __ret;
  18842   __ret = (float32x4_t) {__p0, __p0, __p0, __p0};
  18843   return __ret;
  18844 }
  18845 #else
  18846 __ai __attribute__((target("neon"))) float32x4_t vmovq_n_f32(float32_t __p0) {
  18847   float32x4_t __ret;
  18848   __ret = (float32x4_t) {__p0, __p0, __p0, __p0};
  18849   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18850   return __ret;
  18851 }
  18852 #endif
  18853 
  18854 #ifdef __LITTLE_ENDIAN__
  18855 #define vmovq_n_f16(__p0) __extension__ ({ \
  18856   float16x8_t __ret; \
  18857   float16_t __s0 = __p0; \
  18858   __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \
  18859   __ret; \
  18860 })
  18861 #else
  18862 #define vmovq_n_f16(__p0) __extension__ ({ \
  18863   float16x8_t __ret; \
  18864   float16_t __s0 = __p0; \
  18865   __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \
  18866   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  18867   __ret; \
  18868 })
  18869 #endif
  18870 
  18871 #ifdef __LITTLE_ENDIAN__
  18872 __ai __attribute__((target("neon"))) int32x4_t vmovq_n_s32(int32_t __p0) {
  18873   int32x4_t __ret;
  18874   __ret = (int32x4_t) {__p0, __p0, __p0, __p0};
  18875   return __ret;
  18876 }
  18877 #else
  18878 __ai __attribute__((target("neon"))) int32x4_t vmovq_n_s32(int32_t __p0) {
  18879   int32x4_t __ret;
  18880   __ret = (int32x4_t) {__p0, __p0, __p0, __p0};
  18881   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18882   return __ret;
  18883 }
  18884 #endif
  18885 
  18886 #ifdef __LITTLE_ENDIAN__
  18887 __ai __attribute__((target("neon"))) int64x2_t vmovq_n_s64(int64_t __p0) {
  18888   int64x2_t __ret;
  18889   __ret = (int64x2_t) {__p0, __p0};
  18890   return __ret;
  18891 }
  18892 #else
  18893 __ai __attribute__((target("neon"))) int64x2_t vmovq_n_s64(int64_t __p0) {
  18894   int64x2_t __ret;
  18895   __ret = (int64x2_t) {__p0, __p0};
  18896   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18897   return __ret;
  18898 }
  18899 #endif
  18900 
  18901 #ifdef __LITTLE_ENDIAN__
  18902 __ai __attribute__((target("neon"))) int16x8_t vmovq_n_s16(int16_t __p0) {
  18903   int16x8_t __ret;
  18904   __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18905   return __ret;
  18906 }
  18907 #else
  18908 __ai __attribute__((target("neon"))) int16x8_t vmovq_n_s16(int16_t __p0) {
  18909   int16x8_t __ret;
  18910   __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18911   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18912   return __ret;
  18913 }
  18914 #endif
  18915 
  18916 #ifdef __LITTLE_ENDIAN__
  18917 __ai __attribute__((target("neon"))) uint8x8_t vmov_n_u8(uint8_t __p0) {
  18918   uint8x8_t __ret;
  18919   __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18920   return __ret;
  18921 }
  18922 #else
  18923 __ai __attribute__((target("neon"))) uint8x8_t vmov_n_u8(uint8_t __p0) {
  18924   uint8x8_t __ret;
  18925   __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18926   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18927   return __ret;
  18928 }
  18929 #endif
  18930 
  18931 #ifdef __LITTLE_ENDIAN__
  18932 __ai __attribute__((target("neon"))) uint32x2_t vmov_n_u32(uint32_t __p0) {
  18933   uint32x2_t __ret;
  18934   __ret = (uint32x2_t) {__p0, __p0};
  18935   return __ret;
  18936 }
  18937 #else
  18938 __ai __attribute__((target("neon"))) uint32x2_t vmov_n_u32(uint32_t __p0) {
  18939   uint32x2_t __ret;
  18940   __ret = (uint32x2_t) {__p0, __p0};
  18941   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18942   return __ret;
  18943 }
  18944 #endif
  18945 
  18946 __ai __attribute__((target("neon"))) uint64x1_t vmov_n_u64(uint64_t __p0) {
  18947   uint64x1_t __ret;
  18948   __ret = (uint64x1_t) {__p0};
  18949   return __ret;
  18950 }
  18951 #ifdef __LITTLE_ENDIAN__
  18952 __ai __attribute__((target("neon"))) uint16x4_t vmov_n_u16(uint16_t __p0) {
  18953   uint16x4_t __ret;
  18954   __ret = (uint16x4_t) {__p0, __p0, __p0, __p0};
  18955   return __ret;
  18956 }
  18957 #else
  18958 __ai __attribute__((target("neon"))) uint16x4_t vmov_n_u16(uint16_t __p0) {
  18959   uint16x4_t __ret;
  18960   __ret = (uint16x4_t) {__p0, __p0, __p0, __p0};
  18961   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  18962   return __ret;
  18963 }
  18964 #endif
  18965 
  18966 #ifdef __LITTLE_ENDIAN__
  18967 __ai __attribute__((target("neon"))) int8x8_t vmov_n_s8(int8_t __p0) {
  18968   int8x8_t __ret;
  18969   __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18970   return __ret;
  18971 }
  18972 #else
  18973 __ai __attribute__((target("neon"))) int8x8_t vmov_n_s8(int8_t __p0) {
  18974   int8x8_t __ret;
  18975   __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0};
  18976   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  18977   return __ret;
  18978 }
  18979 #endif
  18980 
  18981 #ifdef __LITTLE_ENDIAN__
  18982 __ai __attribute__((target("neon"))) float32x2_t vmov_n_f32(float32_t __p0) {
  18983   float32x2_t __ret;
  18984   __ret = (float32x2_t) {__p0, __p0};
  18985   return __ret;
  18986 }
  18987 #else
  18988 __ai __attribute__((target("neon"))) float32x2_t vmov_n_f32(float32_t __p0) {
  18989   float32x2_t __ret;
  18990   __ret = (float32x2_t) {__p0, __p0};
  18991   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  18992   return __ret;
  18993 }
  18994 #endif
  18995 
  18996 #ifdef __LITTLE_ENDIAN__
  18997 #define vmov_n_f16(__p0) __extension__ ({ \
  18998   float16x4_t __ret; \
  18999   float16_t __s0 = __p0; \
  19000   __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \
  19001   __ret; \
  19002 })
  19003 #else
  19004 #define vmov_n_f16(__p0) __extension__ ({ \
  19005   float16x4_t __ret; \
  19006   float16_t __s0 = __p0; \
  19007   __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \
  19008   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  19009   __ret; \
  19010 })
  19011 #endif
  19012 
  19013 #ifdef __LITTLE_ENDIAN__
  19014 __ai __attribute__((target("neon"))) int32x2_t vmov_n_s32(int32_t __p0) {
  19015   int32x2_t __ret;
  19016   __ret = (int32x2_t) {__p0, __p0};
  19017   return __ret;
  19018 }
  19019 #else
  19020 __ai __attribute__((target("neon"))) int32x2_t vmov_n_s32(int32_t __p0) {
  19021   int32x2_t __ret;
  19022   __ret = (int32x2_t) {__p0, __p0};
  19023   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19024   return __ret;
  19025 }
  19026 #endif
  19027 
  19028 __ai __attribute__((target("neon"))) int64x1_t vmov_n_s64(int64_t __p0) {
  19029   int64x1_t __ret;
  19030   __ret = (int64x1_t) {__p0};
  19031   return __ret;
  19032 }
  19033 #ifdef __LITTLE_ENDIAN__
  19034 __ai __attribute__((target("neon"))) int16x4_t vmov_n_s16(int16_t __p0) {
  19035   int16x4_t __ret;
  19036   __ret = (int16x4_t) {__p0, __p0, __p0, __p0};
  19037   return __ret;
  19038 }
  19039 #else
  19040 __ai __attribute__((target("neon"))) int16x4_t vmov_n_s16(int16_t __p0) {
  19041   int16x4_t __ret;
  19042   __ret = (int16x4_t) {__p0, __p0, __p0, __p0};
  19043   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19044   return __ret;
  19045 }
  19046 #endif
  19047 
  19048 #ifdef __LITTLE_ENDIAN__
  19049 __ai __attribute__((target("neon"))) uint16x8_t vmovl_u8(uint8x8_t __p0) {
  19050   uint16x8_t __ret;
  19051   __ret = (uint16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 49);
  19052   return __ret;
  19053 }
  19054 #else
  19055 __ai __attribute__((target("neon"))) uint16x8_t vmovl_u8(uint8x8_t __p0) {
  19056   uint16x8_t __ret;
  19057   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19058   __ret = (uint16x8_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 49);
  19059   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19060   return __ret;
  19061 }
  19062 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmovl_u8(uint8x8_t __p0) {
  19063   uint16x8_t __ret;
  19064   __ret = (uint16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 49);
  19065   return __ret;
  19066 }
  19067 #endif
  19068 
  19069 #ifdef __LITTLE_ENDIAN__
  19070 __ai __attribute__((target("neon"))) uint64x2_t vmovl_u32(uint32x2_t __p0) {
  19071   uint64x2_t __ret;
  19072   __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 51);
  19073   return __ret;
  19074 }
  19075 #else
  19076 __ai __attribute__((target("neon"))) uint64x2_t vmovl_u32(uint32x2_t __p0) {
  19077   uint64x2_t __ret;
  19078   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19079   __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 51);
  19080   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19081   return __ret;
  19082 }
  19083 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmovl_u32(uint32x2_t __p0) {
  19084   uint64x2_t __ret;
  19085   __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 51);
  19086   return __ret;
  19087 }
  19088 #endif
  19089 
  19090 #ifdef __LITTLE_ENDIAN__
  19091 __ai __attribute__((target("neon"))) uint32x4_t vmovl_u16(uint16x4_t __p0) {
  19092   uint32x4_t __ret;
  19093   __ret = (uint32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 50);
  19094   return __ret;
  19095 }
  19096 #else
  19097 __ai __attribute__((target("neon"))) uint32x4_t vmovl_u16(uint16x4_t __p0) {
  19098   uint32x4_t __ret;
  19099   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19100   __ret = (uint32x4_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 50);
  19101   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19102   return __ret;
  19103 }
  19104 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmovl_u16(uint16x4_t __p0) {
  19105   uint32x4_t __ret;
  19106   __ret = (uint32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 50);
  19107   return __ret;
  19108 }
  19109 #endif
  19110 
  19111 #ifdef __LITTLE_ENDIAN__
  19112 __ai __attribute__((target("neon"))) int16x8_t vmovl_s8(int8x8_t __p0) {
  19113   int16x8_t __ret;
  19114   __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 33);
  19115   return __ret;
  19116 }
  19117 #else
  19118 __ai __attribute__((target("neon"))) int16x8_t vmovl_s8(int8x8_t __p0) {
  19119   int16x8_t __ret;
  19120   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19121   __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 33);
  19122   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19123   return __ret;
  19124 }
  19125 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmovl_s8(int8x8_t __p0) {
  19126   int16x8_t __ret;
  19127   __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 33);
  19128   return __ret;
  19129 }
  19130 #endif
  19131 
  19132 #ifdef __LITTLE_ENDIAN__
  19133 __ai __attribute__((target("neon"))) int64x2_t vmovl_s32(int32x2_t __p0) {
  19134   int64x2_t __ret;
  19135   __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 35);
  19136   return __ret;
  19137 }
  19138 #else
  19139 __ai __attribute__((target("neon"))) int64x2_t vmovl_s32(int32x2_t __p0) {
  19140   int64x2_t __ret;
  19141   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19142   __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 35);
  19143   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19144   return __ret;
  19145 }
  19146 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmovl_s32(int32x2_t __p0) {
  19147   int64x2_t __ret;
  19148   __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 35);
  19149   return __ret;
  19150 }
  19151 #endif
  19152 
  19153 #ifdef __LITTLE_ENDIAN__
  19154 __ai __attribute__((target("neon"))) int32x4_t vmovl_s16(int16x4_t __p0) {
  19155   int32x4_t __ret;
  19156   __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 34);
  19157   return __ret;
  19158 }
  19159 #else
  19160 __ai __attribute__((target("neon"))) int32x4_t vmovl_s16(int16x4_t __p0) {
  19161   int32x4_t __ret;
  19162   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19163   __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 34);
  19164   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19165   return __ret;
  19166 }
  19167 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmovl_s16(int16x4_t __p0) {
  19168   int32x4_t __ret;
  19169   __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 34);
  19170   return __ret;
  19171 }
  19172 #endif
  19173 
  19174 #ifdef __LITTLE_ENDIAN__
  19175 __ai __attribute__((target("neon"))) uint16x4_t vmovn_u32(uint32x4_t __p0) {
  19176   uint16x4_t __ret;
  19177   __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 17);
  19178   return __ret;
  19179 }
  19180 #else
  19181 __ai __attribute__((target("neon"))) uint16x4_t vmovn_u32(uint32x4_t __p0) {
  19182   uint16x4_t __ret;
  19183   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19184   __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 17);
  19185   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19186   return __ret;
  19187 }
  19188 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vmovn_u32(uint32x4_t __p0) {
  19189   uint16x4_t __ret;
  19190   __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 17);
  19191   return __ret;
  19192 }
  19193 #endif
  19194 
  19195 #ifdef __LITTLE_ENDIAN__
  19196 __ai __attribute__((target("neon"))) uint32x2_t vmovn_u64(uint64x2_t __p0) {
  19197   uint32x2_t __ret;
  19198   __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 18);
  19199   return __ret;
  19200 }
  19201 #else
  19202 __ai __attribute__((target("neon"))) uint32x2_t vmovn_u64(uint64x2_t __p0) {
  19203   uint32x2_t __ret;
  19204   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19205   __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 18);
  19206   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19207   return __ret;
  19208 }
  19209 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vmovn_u64(uint64x2_t __p0) {
  19210   uint32x2_t __ret;
  19211   __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 18);
  19212   return __ret;
  19213 }
  19214 #endif
  19215 
  19216 #ifdef __LITTLE_ENDIAN__
  19217 __ai __attribute__((target("neon"))) uint8x8_t vmovn_u16(uint16x8_t __p0) {
  19218   uint8x8_t __ret;
  19219   __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 16);
  19220   return __ret;
  19221 }
  19222 #else
  19223 __ai __attribute__((target("neon"))) uint8x8_t vmovn_u16(uint16x8_t __p0) {
  19224   uint8x8_t __ret;
  19225   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19226   __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 16);
  19227   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19228   return __ret;
  19229 }
  19230 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vmovn_u16(uint16x8_t __p0) {
  19231   uint8x8_t __ret;
  19232   __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 16);
  19233   return __ret;
  19234 }
  19235 #endif
  19236 
  19237 #ifdef __LITTLE_ENDIAN__
  19238 __ai __attribute__((target("neon"))) int16x4_t vmovn_s32(int32x4_t __p0) {
  19239   int16x4_t __ret;
  19240   __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 1);
  19241   return __ret;
  19242 }
  19243 #else
  19244 __ai __attribute__((target("neon"))) int16x4_t vmovn_s32(int32x4_t __p0) {
  19245   int16x4_t __ret;
  19246   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19247   __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 1);
  19248   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19249   return __ret;
  19250 }
  19251 __ai __attribute__((target("neon"))) int16x4_t __noswap_vmovn_s32(int32x4_t __p0) {
  19252   int16x4_t __ret;
  19253   __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 1);
  19254   return __ret;
  19255 }
  19256 #endif
  19257 
  19258 #ifdef __LITTLE_ENDIAN__
  19259 __ai __attribute__((target("neon"))) int32x2_t vmovn_s64(int64x2_t __p0) {
  19260   int32x2_t __ret;
  19261   __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 2);
  19262   return __ret;
  19263 }
  19264 #else
  19265 __ai __attribute__((target("neon"))) int32x2_t vmovn_s64(int64x2_t __p0) {
  19266   int32x2_t __ret;
  19267   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19268   __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 2);
  19269   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19270   return __ret;
  19271 }
  19272 __ai __attribute__((target("neon"))) int32x2_t __noswap_vmovn_s64(int64x2_t __p0) {
  19273   int32x2_t __ret;
  19274   __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 2);
  19275   return __ret;
  19276 }
  19277 #endif
  19278 
  19279 #ifdef __LITTLE_ENDIAN__
  19280 __ai __attribute__((target("neon"))) int8x8_t vmovn_s16(int16x8_t __p0) {
  19281   int8x8_t __ret;
  19282   __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 0);
  19283   return __ret;
  19284 }
  19285 #else
  19286 __ai __attribute__((target("neon"))) int8x8_t vmovn_s16(int16x8_t __p0) {
  19287   int8x8_t __ret;
  19288   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19289   __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 0);
  19290   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19291   return __ret;
  19292 }
  19293 __ai __attribute__((target("neon"))) int8x8_t __noswap_vmovn_s16(int16x8_t __p0) {
  19294   int8x8_t __ret;
  19295   __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 0);
  19296   return __ret;
  19297 }
  19298 #endif
  19299 
  19300 #ifdef __LITTLE_ENDIAN__
  19301 __ai __attribute__((target("neon"))) uint8x16_t vmulq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  19302   uint8x16_t __ret;
  19303   __ret = __p0 * __p1;
  19304   return __ret;
  19305 }
  19306 #else
  19307 __ai __attribute__((target("neon"))) uint8x16_t vmulq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  19308   uint8x16_t __ret;
  19309   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19310   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19311   __ret = __rev0 * __rev1;
  19312   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19313   return __ret;
  19314 }
  19315 #endif
  19316 
  19317 #ifdef __LITTLE_ENDIAN__
  19318 __ai __attribute__((target("neon"))) uint32x4_t vmulq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  19319   uint32x4_t __ret;
  19320   __ret = __p0 * __p1;
  19321   return __ret;
  19322 }
  19323 #else
  19324 __ai __attribute__((target("neon"))) uint32x4_t vmulq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  19325   uint32x4_t __ret;
  19326   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19327   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  19328   __ret = __rev0 * __rev1;
  19329   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19330   return __ret;
  19331 }
  19332 #endif
  19333 
  19334 #ifdef __LITTLE_ENDIAN__
  19335 __ai __attribute__((target("neon"))) uint16x8_t vmulq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  19336   uint16x8_t __ret;
  19337   __ret = __p0 * __p1;
  19338   return __ret;
  19339 }
  19340 #else
  19341 __ai __attribute__((target("neon"))) uint16x8_t vmulq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  19342   uint16x8_t __ret;
  19343   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19344   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19345   __ret = __rev0 * __rev1;
  19346   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19347   return __ret;
  19348 }
  19349 #endif
  19350 
  19351 #ifdef __LITTLE_ENDIAN__
  19352 __ai __attribute__((target("neon"))) int8x16_t vmulq_s8(int8x16_t __p0, int8x16_t __p1) {
  19353   int8x16_t __ret;
  19354   __ret = __p0 * __p1;
  19355   return __ret;
  19356 }
  19357 #else
  19358 __ai __attribute__((target("neon"))) int8x16_t vmulq_s8(int8x16_t __p0, int8x16_t __p1) {
  19359   int8x16_t __ret;
  19360   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19361   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19362   __ret = __rev0 * __rev1;
  19363   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19364   return __ret;
  19365 }
  19366 #endif
  19367 
  19368 #ifdef __LITTLE_ENDIAN__
  19369 __ai __attribute__((target("neon"))) float32x4_t vmulq_f32(float32x4_t __p0, float32x4_t __p1) {
  19370   float32x4_t __ret;
  19371   __ret = __p0 * __p1;
  19372   return __ret;
  19373 }
  19374 #else
  19375 __ai __attribute__((target("neon"))) float32x4_t vmulq_f32(float32x4_t __p0, float32x4_t __p1) {
  19376   float32x4_t __ret;
  19377   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19378   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  19379   __ret = __rev0 * __rev1;
  19380   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19381   return __ret;
  19382 }
  19383 #endif
  19384 
  19385 #ifdef __LITTLE_ENDIAN__
  19386 __ai __attribute__((target("neon"))) int32x4_t vmulq_s32(int32x4_t __p0, int32x4_t __p1) {
  19387   int32x4_t __ret;
  19388   __ret = __p0 * __p1;
  19389   return __ret;
  19390 }
  19391 #else
  19392 __ai __attribute__((target("neon"))) int32x4_t vmulq_s32(int32x4_t __p0, int32x4_t __p1) {
  19393   int32x4_t __ret;
  19394   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19395   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  19396   __ret = __rev0 * __rev1;
  19397   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19398   return __ret;
  19399 }
  19400 #endif
  19401 
  19402 #ifdef __LITTLE_ENDIAN__
  19403 __ai __attribute__((target("neon"))) int16x8_t vmulq_s16(int16x8_t __p0, int16x8_t __p1) {
  19404   int16x8_t __ret;
  19405   __ret = __p0 * __p1;
  19406   return __ret;
  19407 }
  19408 #else
  19409 __ai __attribute__((target("neon"))) int16x8_t vmulq_s16(int16x8_t __p0, int16x8_t __p1) {
  19410   int16x8_t __ret;
  19411   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19412   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19413   __ret = __rev0 * __rev1;
  19414   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19415   return __ret;
  19416 }
  19417 #endif
  19418 
  19419 #ifdef __LITTLE_ENDIAN__
  19420 __ai __attribute__((target("neon"))) uint8x8_t vmul_u8(uint8x8_t __p0, uint8x8_t __p1) {
  19421   uint8x8_t __ret;
  19422   __ret = __p0 * __p1;
  19423   return __ret;
  19424 }
  19425 #else
  19426 __ai __attribute__((target("neon"))) uint8x8_t vmul_u8(uint8x8_t __p0, uint8x8_t __p1) {
  19427   uint8x8_t __ret;
  19428   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19429   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19430   __ret = __rev0 * __rev1;
  19431   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19432   return __ret;
  19433 }
  19434 #endif
  19435 
  19436 #ifdef __LITTLE_ENDIAN__
  19437 __ai __attribute__((target("neon"))) uint32x2_t vmul_u32(uint32x2_t __p0, uint32x2_t __p1) {
  19438   uint32x2_t __ret;
  19439   __ret = __p0 * __p1;
  19440   return __ret;
  19441 }
  19442 #else
  19443 __ai __attribute__((target("neon"))) uint32x2_t vmul_u32(uint32x2_t __p0, uint32x2_t __p1) {
  19444   uint32x2_t __ret;
  19445   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19446   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  19447   __ret = __rev0 * __rev1;
  19448   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19449   return __ret;
  19450 }
  19451 #endif
  19452 
  19453 #ifdef __LITTLE_ENDIAN__
  19454 __ai __attribute__((target("neon"))) uint16x4_t vmul_u16(uint16x4_t __p0, uint16x4_t __p1) {
  19455   uint16x4_t __ret;
  19456   __ret = __p0 * __p1;
  19457   return __ret;
  19458 }
  19459 #else
  19460 __ai __attribute__((target("neon"))) uint16x4_t vmul_u16(uint16x4_t __p0, uint16x4_t __p1) {
  19461   uint16x4_t __ret;
  19462   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19463   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  19464   __ret = __rev0 * __rev1;
  19465   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19466   return __ret;
  19467 }
  19468 #endif
  19469 
  19470 #ifdef __LITTLE_ENDIAN__
  19471 __ai __attribute__((target("neon"))) int8x8_t vmul_s8(int8x8_t __p0, int8x8_t __p1) {
  19472   int8x8_t __ret;
  19473   __ret = __p0 * __p1;
  19474   return __ret;
  19475 }
  19476 #else
  19477 __ai __attribute__((target("neon"))) int8x8_t vmul_s8(int8x8_t __p0, int8x8_t __p1) {
  19478   int8x8_t __ret;
  19479   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19480   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19481   __ret = __rev0 * __rev1;
  19482   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19483   return __ret;
  19484 }
  19485 #endif
  19486 
  19487 #ifdef __LITTLE_ENDIAN__
  19488 __ai __attribute__((target("neon"))) float32x2_t vmul_f32(float32x2_t __p0, float32x2_t __p1) {
  19489   float32x2_t __ret;
  19490   __ret = __p0 * __p1;
  19491   return __ret;
  19492 }
  19493 #else
  19494 __ai __attribute__((target("neon"))) float32x2_t vmul_f32(float32x2_t __p0, float32x2_t __p1) {
  19495   float32x2_t __ret;
  19496   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19497   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  19498   __ret = __rev0 * __rev1;
  19499   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19500   return __ret;
  19501 }
  19502 #endif
  19503 
  19504 #ifdef __LITTLE_ENDIAN__
  19505 __ai __attribute__((target("neon"))) int32x2_t vmul_s32(int32x2_t __p0, int32x2_t __p1) {
  19506   int32x2_t __ret;
  19507   __ret = __p0 * __p1;
  19508   return __ret;
  19509 }
  19510 #else
  19511 __ai __attribute__((target("neon"))) int32x2_t vmul_s32(int32x2_t __p0, int32x2_t __p1) {
  19512   int32x2_t __ret;
  19513   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19514   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  19515   __ret = __rev0 * __rev1;
  19516   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19517   return __ret;
  19518 }
  19519 #endif
  19520 
  19521 #ifdef __LITTLE_ENDIAN__
  19522 __ai __attribute__((target("neon"))) int16x4_t vmul_s16(int16x4_t __p0, int16x4_t __p1) {
  19523   int16x4_t __ret;
  19524   __ret = __p0 * __p1;
  19525   return __ret;
  19526 }
  19527 #else
  19528 __ai __attribute__((target("neon"))) int16x4_t vmul_s16(int16x4_t __p0, int16x4_t __p1) {
  19529   int16x4_t __ret;
  19530   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19531   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  19532   __ret = __rev0 * __rev1;
  19533   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19534   return __ret;
  19535 }
  19536 #endif
  19537 
  19538 #ifdef __LITTLE_ENDIAN__
  19539 __ai __attribute__((target("neon"))) poly8x8_t vmul_p8(poly8x8_t __p0, poly8x8_t __p1) {
  19540   poly8x8_t __ret;
  19541   __ret = (poly8x8_t) __builtin_neon_vmul_v((int8x8_t)__p0, (int8x8_t)__p1, 4);
  19542   return __ret;
  19543 }
  19544 #else
  19545 __ai __attribute__((target("neon"))) poly8x8_t vmul_p8(poly8x8_t __p0, poly8x8_t __p1) {
  19546   poly8x8_t __ret;
  19547   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19548   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19549   __ret = (poly8x8_t) __builtin_neon_vmul_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4);
  19550   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19551   return __ret;
  19552 }
  19553 #endif
  19554 
  19555 #ifdef __LITTLE_ENDIAN__
  19556 __ai __attribute__((target("neon"))) poly8x16_t vmulq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  19557   poly8x16_t __ret;
  19558   __ret = (poly8x16_t) __builtin_neon_vmulq_v((int8x16_t)__p0, (int8x16_t)__p1, 36);
  19559   return __ret;
  19560 }
  19561 #else
  19562 __ai __attribute__((target("neon"))) poly8x16_t vmulq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  19563   poly8x16_t __ret;
  19564   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19565   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19566   __ret = (poly8x16_t) __builtin_neon_vmulq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36);
  19567   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  19568   return __ret;
  19569 }
  19570 #endif
  19571 
  19572 #ifdef __LITTLE_ENDIAN__
  19573 #define vmulq_lane_u32(__p0_94, __p1_94, __p2_94) __extension__ ({ \
  19574   uint32x4_t __ret_94; \
  19575   uint32x4_t __s0_94 = __p0_94; \
  19576   uint32x2_t __s1_94 = __p1_94; \
  19577   __ret_94 = __s0_94 * splatq_lane_u32(__s1_94, __p2_94); \
  19578   __ret_94; \
  19579 })
  19580 #else
  19581 #define vmulq_lane_u32(__p0_95, __p1_95, __p2_95) __extension__ ({ \
  19582   uint32x4_t __ret_95; \
  19583   uint32x4_t __s0_95 = __p0_95; \
  19584   uint32x2_t __s1_95 = __p1_95; \
  19585   uint32x4_t __rev0_95;  __rev0_95 = __builtin_shufflevector(__s0_95, __s0_95, 3, 2, 1, 0); \
  19586   uint32x2_t __rev1_95;  __rev1_95 = __builtin_shufflevector(__s1_95, __s1_95, 1, 0); \
  19587   __ret_95 = __rev0_95 * __noswap_splatq_lane_u32(__rev1_95, __p2_95); \
  19588   __ret_95 = __builtin_shufflevector(__ret_95, __ret_95, 3, 2, 1, 0); \
  19589   __ret_95; \
  19590 })
  19591 #endif
  19592 
  19593 #ifdef __LITTLE_ENDIAN__
  19594 #define vmulq_lane_u16(__p0_96, __p1_96, __p2_96) __extension__ ({ \
  19595   uint16x8_t __ret_96; \
  19596   uint16x8_t __s0_96 = __p0_96; \
  19597   uint16x4_t __s1_96 = __p1_96; \
  19598   __ret_96 = __s0_96 * splatq_lane_u16(__s1_96, __p2_96); \
  19599   __ret_96; \
  19600 })
  19601 #else
  19602 #define vmulq_lane_u16(__p0_97, __p1_97, __p2_97) __extension__ ({ \
  19603   uint16x8_t __ret_97; \
  19604   uint16x8_t __s0_97 = __p0_97; \
  19605   uint16x4_t __s1_97 = __p1_97; \
  19606   uint16x8_t __rev0_97;  __rev0_97 = __builtin_shufflevector(__s0_97, __s0_97, 7, 6, 5, 4, 3, 2, 1, 0); \
  19607   uint16x4_t __rev1_97;  __rev1_97 = __builtin_shufflevector(__s1_97, __s1_97, 3, 2, 1, 0); \
  19608   __ret_97 = __rev0_97 * __noswap_splatq_lane_u16(__rev1_97, __p2_97); \
  19609   __ret_97 = __builtin_shufflevector(__ret_97, __ret_97, 7, 6, 5, 4, 3, 2, 1, 0); \
  19610   __ret_97; \
  19611 })
  19612 #endif
  19613 
  19614 #ifdef __LITTLE_ENDIAN__
  19615 #define vmulq_lane_f32(__p0_98, __p1_98, __p2_98) __extension__ ({ \
  19616   float32x4_t __ret_98; \
  19617   float32x4_t __s0_98 = __p0_98; \
  19618   float32x2_t __s1_98 = __p1_98; \
  19619   __ret_98 = __s0_98 * splatq_lane_f32(__s1_98, __p2_98); \
  19620   __ret_98; \
  19621 })
  19622 #else
  19623 #define vmulq_lane_f32(__p0_99, __p1_99, __p2_99) __extension__ ({ \
  19624   float32x4_t __ret_99; \
  19625   float32x4_t __s0_99 = __p0_99; \
  19626   float32x2_t __s1_99 = __p1_99; \
  19627   float32x4_t __rev0_99;  __rev0_99 = __builtin_shufflevector(__s0_99, __s0_99, 3, 2, 1, 0); \
  19628   float32x2_t __rev1_99;  __rev1_99 = __builtin_shufflevector(__s1_99, __s1_99, 1, 0); \
  19629   __ret_99 = __rev0_99 * __noswap_splatq_lane_f32(__rev1_99, __p2_99); \
  19630   __ret_99 = __builtin_shufflevector(__ret_99, __ret_99, 3, 2, 1, 0); \
  19631   __ret_99; \
  19632 })
  19633 #endif
  19634 
  19635 #ifdef __LITTLE_ENDIAN__
  19636 #define vmulq_lane_s32(__p0_100, __p1_100, __p2_100) __extension__ ({ \
  19637   int32x4_t __ret_100; \
  19638   int32x4_t __s0_100 = __p0_100; \
  19639   int32x2_t __s1_100 = __p1_100; \
  19640   __ret_100 = __s0_100 * splatq_lane_s32(__s1_100, __p2_100); \
  19641   __ret_100; \
  19642 })
  19643 #else
  19644 #define vmulq_lane_s32(__p0_101, __p1_101, __p2_101) __extension__ ({ \
  19645   int32x4_t __ret_101; \
  19646   int32x4_t __s0_101 = __p0_101; \
  19647   int32x2_t __s1_101 = __p1_101; \
  19648   int32x4_t __rev0_101;  __rev0_101 = __builtin_shufflevector(__s0_101, __s0_101, 3, 2, 1, 0); \
  19649   int32x2_t __rev1_101;  __rev1_101 = __builtin_shufflevector(__s1_101, __s1_101, 1, 0); \
  19650   __ret_101 = __rev0_101 * __noswap_splatq_lane_s32(__rev1_101, __p2_101); \
  19651   __ret_101 = __builtin_shufflevector(__ret_101, __ret_101, 3, 2, 1, 0); \
  19652   __ret_101; \
  19653 })
  19654 #endif
  19655 
  19656 #ifdef __LITTLE_ENDIAN__
  19657 #define vmulq_lane_s16(__p0_102, __p1_102, __p2_102) __extension__ ({ \
  19658   int16x8_t __ret_102; \
  19659   int16x8_t __s0_102 = __p0_102; \
  19660   int16x4_t __s1_102 = __p1_102; \
  19661   __ret_102 = __s0_102 * splatq_lane_s16(__s1_102, __p2_102); \
  19662   __ret_102; \
  19663 })
  19664 #else
  19665 #define vmulq_lane_s16(__p0_103, __p1_103, __p2_103) __extension__ ({ \
  19666   int16x8_t __ret_103; \
  19667   int16x8_t __s0_103 = __p0_103; \
  19668   int16x4_t __s1_103 = __p1_103; \
  19669   int16x8_t __rev0_103;  __rev0_103 = __builtin_shufflevector(__s0_103, __s0_103, 7, 6, 5, 4, 3, 2, 1, 0); \
  19670   int16x4_t __rev1_103;  __rev1_103 = __builtin_shufflevector(__s1_103, __s1_103, 3, 2, 1, 0); \
  19671   __ret_103 = __rev0_103 * __noswap_splatq_lane_s16(__rev1_103, __p2_103); \
  19672   __ret_103 = __builtin_shufflevector(__ret_103, __ret_103, 7, 6, 5, 4, 3, 2, 1, 0); \
  19673   __ret_103; \
  19674 })
  19675 #endif
  19676 
  19677 #ifdef __LITTLE_ENDIAN__
  19678 #define vmul_lane_u32(__p0_104, __p1_104, __p2_104) __extension__ ({ \
  19679   uint32x2_t __ret_104; \
  19680   uint32x2_t __s0_104 = __p0_104; \
  19681   uint32x2_t __s1_104 = __p1_104; \
  19682   __ret_104 = __s0_104 * splat_lane_u32(__s1_104, __p2_104); \
  19683   __ret_104; \
  19684 })
  19685 #else
  19686 #define vmul_lane_u32(__p0_105, __p1_105, __p2_105) __extension__ ({ \
  19687   uint32x2_t __ret_105; \
  19688   uint32x2_t __s0_105 = __p0_105; \
  19689   uint32x2_t __s1_105 = __p1_105; \
  19690   uint32x2_t __rev0_105;  __rev0_105 = __builtin_shufflevector(__s0_105, __s0_105, 1, 0); \
  19691   uint32x2_t __rev1_105;  __rev1_105 = __builtin_shufflevector(__s1_105, __s1_105, 1, 0); \
  19692   __ret_105 = __rev0_105 * __noswap_splat_lane_u32(__rev1_105, __p2_105); \
  19693   __ret_105 = __builtin_shufflevector(__ret_105, __ret_105, 1, 0); \
  19694   __ret_105; \
  19695 })
  19696 #endif
  19697 
  19698 #ifdef __LITTLE_ENDIAN__
  19699 #define vmul_lane_u16(__p0_106, __p1_106, __p2_106) __extension__ ({ \
  19700   uint16x4_t __ret_106; \
  19701   uint16x4_t __s0_106 = __p0_106; \
  19702   uint16x4_t __s1_106 = __p1_106; \
  19703   __ret_106 = __s0_106 * splat_lane_u16(__s1_106, __p2_106); \
  19704   __ret_106; \
  19705 })
  19706 #else
  19707 #define vmul_lane_u16(__p0_107, __p1_107, __p2_107) __extension__ ({ \
  19708   uint16x4_t __ret_107; \
  19709   uint16x4_t __s0_107 = __p0_107; \
  19710   uint16x4_t __s1_107 = __p1_107; \
  19711   uint16x4_t __rev0_107;  __rev0_107 = __builtin_shufflevector(__s0_107, __s0_107, 3, 2, 1, 0); \
  19712   uint16x4_t __rev1_107;  __rev1_107 = __builtin_shufflevector(__s1_107, __s1_107, 3, 2, 1, 0); \
  19713   __ret_107 = __rev0_107 * __noswap_splat_lane_u16(__rev1_107, __p2_107); \
  19714   __ret_107 = __builtin_shufflevector(__ret_107, __ret_107, 3, 2, 1, 0); \
  19715   __ret_107; \
  19716 })
  19717 #endif
  19718 
  19719 #ifdef __LITTLE_ENDIAN__
  19720 #define vmul_lane_f32(__p0_108, __p1_108, __p2_108) __extension__ ({ \
  19721   float32x2_t __ret_108; \
  19722   float32x2_t __s0_108 = __p0_108; \
  19723   float32x2_t __s1_108 = __p1_108; \
  19724   __ret_108 = __s0_108 * splat_lane_f32(__s1_108, __p2_108); \
  19725   __ret_108; \
  19726 })
  19727 #else
  19728 #define vmul_lane_f32(__p0_109, __p1_109, __p2_109) __extension__ ({ \
  19729   float32x2_t __ret_109; \
  19730   float32x2_t __s0_109 = __p0_109; \
  19731   float32x2_t __s1_109 = __p1_109; \
  19732   float32x2_t __rev0_109;  __rev0_109 = __builtin_shufflevector(__s0_109, __s0_109, 1, 0); \
  19733   float32x2_t __rev1_109;  __rev1_109 = __builtin_shufflevector(__s1_109, __s1_109, 1, 0); \
  19734   __ret_109 = __rev0_109 * __noswap_splat_lane_f32(__rev1_109, __p2_109); \
  19735   __ret_109 = __builtin_shufflevector(__ret_109, __ret_109, 1, 0); \
  19736   __ret_109; \
  19737 })
  19738 #endif
  19739 
  19740 #ifdef __LITTLE_ENDIAN__
  19741 #define vmul_lane_s32(__p0_110, __p1_110, __p2_110) __extension__ ({ \
  19742   int32x2_t __ret_110; \
  19743   int32x2_t __s0_110 = __p0_110; \
  19744   int32x2_t __s1_110 = __p1_110; \
  19745   __ret_110 = __s0_110 * splat_lane_s32(__s1_110, __p2_110); \
  19746   __ret_110; \
  19747 })
  19748 #else
  19749 #define vmul_lane_s32(__p0_111, __p1_111, __p2_111) __extension__ ({ \
  19750   int32x2_t __ret_111; \
  19751   int32x2_t __s0_111 = __p0_111; \
  19752   int32x2_t __s1_111 = __p1_111; \
  19753   int32x2_t __rev0_111;  __rev0_111 = __builtin_shufflevector(__s0_111, __s0_111, 1, 0); \
  19754   int32x2_t __rev1_111;  __rev1_111 = __builtin_shufflevector(__s1_111, __s1_111, 1, 0); \
  19755   __ret_111 = __rev0_111 * __noswap_splat_lane_s32(__rev1_111, __p2_111); \
  19756   __ret_111 = __builtin_shufflevector(__ret_111, __ret_111, 1, 0); \
  19757   __ret_111; \
  19758 })
  19759 #endif
  19760 
  19761 #ifdef __LITTLE_ENDIAN__
  19762 #define vmul_lane_s16(__p0_112, __p1_112, __p2_112) __extension__ ({ \
  19763   int16x4_t __ret_112; \
  19764   int16x4_t __s0_112 = __p0_112; \
  19765   int16x4_t __s1_112 = __p1_112; \
  19766   __ret_112 = __s0_112 * splat_lane_s16(__s1_112, __p2_112); \
  19767   __ret_112; \
  19768 })
  19769 #else
  19770 #define vmul_lane_s16(__p0_113, __p1_113, __p2_113) __extension__ ({ \
  19771   int16x4_t __ret_113; \
  19772   int16x4_t __s0_113 = __p0_113; \
  19773   int16x4_t __s1_113 = __p1_113; \
  19774   int16x4_t __rev0_113;  __rev0_113 = __builtin_shufflevector(__s0_113, __s0_113, 3, 2, 1, 0); \
  19775   int16x4_t __rev1_113;  __rev1_113 = __builtin_shufflevector(__s1_113, __s1_113, 3, 2, 1, 0); \
  19776   __ret_113 = __rev0_113 * __noswap_splat_lane_s16(__rev1_113, __p2_113); \
  19777   __ret_113 = __builtin_shufflevector(__ret_113, __ret_113, 3, 2, 1, 0); \
  19778   __ret_113; \
  19779 })
  19780 #endif
  19781 
  19782 #ifdef __LITTLE_ENDIAN__
  19783 __ai __attribute__((target("neon"))) uint32x4_t vmulq_n_u32(uint32x4_t __p0, uint32_t __p1) {
  19784   uint32x4_t __ret;
  19785   __ret = __p0 * (uint32x4_t) {__p1, __p1, __p1, __p1};
  19786   return __ret;
  19787 }
  19788 #else
  19789 __ai __attribute__((target("neon"))) uint32x4_t vmulq_n_u32(uint32x4_t __p0, uint32_t __p1) {
  19790   uint32x4_t __ret;
  19791   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19792   __ret = __rev0 * (uint32x4_t) {__p1, __p1, __p1, __p1};
  19793   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19794   return __ret;
  19795 }
  19796 #endif
  19797 
  19798 #ifdef __LITTLE_ENDIAN__
  19799 __ai __attribute__((target("neon"))) uint16x8_t vmulq_n_u16(uint16x8_t __p0, uint16_t __p1) {
  19800   uint16x8_t __ret;
  19801   __ret = __p0 * (uint16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1};
  19802   return __ret;
  19803 }
  19804 #else
  19805 __ai __attribute__((target("neon"))) uint16x8_t vmulq_n_u16(uint16x8_t __p0, uint16_t __p1) {
  19806   uint16x8_t __ret;
  19807   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19808   __ret = __rev0 * (uint16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1};
  19809   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19810   return __ret;
  19811 }
  19812 #endif
  19813 
  19814 #ifdef __LITTLE_ENDIAN__
  19815 __ai __attribute__((target("neon"))) float32x4_t vmulq_n_f32(float32x4_t __p0, float32_t __p1) {
  19816   float32x4_t __ret;
  19817   __ret = __p0 * (float32x4_t) {__p1, __p1, __p1, __p1};
  19818   return __ret;
  19819 }
  19820 #else
  19821 __ai __attribute__((target("neon"))) float32x4_t vmulq_n_f32(float32x4_t __p0, float32_t __p1) {
  19822   float32x4_t __ret;
  19823   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19824   __ret = __rev0 * (float32x4_t) {__p1, __p1, __p1, __p1};
  19825   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19826   return __ret;
  19827 }
  19828 #endif
  19829 
  19830 #ifdef __LITTLE_ENDIAN__
  19831 __ai __attribute__((target("neon"))) int32x4_t vmulq_n_s32(int32x4_t __p0, int32_t __p1) {
  19832   int32x4_t __ret;
  19833   __ret = __p0 * (int32x4_t) {__p1, __p1, __p1, __p1};
  19834   return __ret;
  19835 }
  19836 #else
  19837 __ai __attribute__((target("neon"))) int32x4_t vmulq_n_s32(int32x4_t __p0, int32_t __p1) {
  19838   int32x4_t __ret;
  19839   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19840   __ret = __rev0 * (int32x4_t) {__p1, __p1, __p1, __p1};
  19841   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19842   return __ret;
  19843 }
  19844 #endif
  19845 
  19846 #ifdef __LITTLE_ENDIAN__
  19847 __ai __attribute__((target("neon"))) int16x8_t vmulq_n_s16(int16x8_t __p0, int16_t __p1) {
  19848   int16x8_t __ret;
  19849   __ret = __p0 * (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1};
  19850   return __ret;
  19851 }
  19852 #else
  19853 __ai __attribute__((target("neon"))) int16x8_t vmulq_n_s16(int16x8_t __p0, int16_t __p1) {
  19854   int16x8_t __ret;
  19855   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19856   __ret = __rev0 * (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1};
  19857   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19858   return __ret;
  19859 }
  19860 #endif
  19861 
  19862 #ifdef __LITTLE_ENDIAN__
  19863 __ai __attribute__((target("neon"))) uint32x2_t vmul_n_u32(uint32x2_t __p0, uint32_t __p1) {
  19864   uint32x2_t __ret;
  19865   __ret = __p0 * (uint32x2_t) {__p1, __p1};
  19866   return __ret;
  19867 }
  19868 #else
  19869 __ai __attribute__((target("neon"))) uint32x2_t vmul_n_u32(uint32x2_t __p0, uint32_t __p1) {
  19870   uint32x2_t __ret;
  19871   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19872   __ret = __rev0 * (uint32x2_t) {__p1, __p1};
  19873   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19874   return __ret;
  19875 }
  19876 #endif
  19877 
  19878 #ifdef __LITTLE_ENDIAN__
  19879 __ai __attribute__((target("neon"))) uint16x4_t vmul_n_u16(uint16x4_t __p0, uint16_t __p1) {
  19880   uint16x4_t __ret;
  19881   __ret = __p0 * (uint16x4_t) {__p1, __p1, __p1, __p1};
  19882   return __ret;
  19883 }
  19884 #else
  19885 __ai __attribute__((target("neon"))) uint16x4_t vmul_n_u16(uint16x4_t __p0, uint16_t __p1) {
  19886   uint16x4_t __ret;
  19887   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19888   __ret = __rev0 * (uint16x4_t) {__p1, __p1, __p1, __p1};
  19889   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19890   return __ret;
  19891 }
  19892 #endif
  19893 
  19894 #ifdef __LITTLE_ENDIAN__
  19895 __ai __attribute__((target("neon"))) float32x2_t vmul_n_f32(float32x2_t __p0, float32_t __p1) {
  19896   float32x2_t __ret;
  19897   __ret = __p0 * (float32x2_t) {__p1, __p1};
  19898   return __ret;
  19899 }
  19900 #else
  19901 __ai __attribute__((target("neon"))) float32x2_t vmul_n_f32(float32x2_t __p0, float32_t __p1) {
  19902   float32x2_t __ret;
  19903   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19904   __ret = __rev0 * (float32x2_t) {__p1, __p1};
  19905   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19906   return __ret;
  19907 }
  19908 #endif
  19909 
  19910 #ifdef __LITTLE_ENDIAN__
  19911 __ai __attribute__((target("neon"))) int32x2_t vmul_n_s32(int32x2_t __p0, int32_t __p1) {
  19912   int32x2_t __ret;
  19913   __ret = __p0 * (int32x2_t) {__p1, __p1};
  19914   return __ret;
  19915 }
  19916 #else
  19917 __ai __attribute__((target("neon"))) int32x2_t vmul_n_s32(int32x2_t __p0, int32_t __p1) {
  19918   int32x2_t __ret;
  19919   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19920   __ret = __rev0 * (int32x2_t) {__p1, __p1};
  19921   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19922   return __ret;
  19923 }
  19924 #endif
  19925 
  19926 #ifdef __LITTLE_ENDIAN__
  19927 __ai __attribute__((target("neon"))) int16x4_t vmul_n_s16(int16x4_t __p0, int16_t __p1) {
  19928   int16x4_t __ret;
  19929   __ret = __p0 * (int16x4_t) {__p1, __p1, __p1, __p1};
  19930   return __ret;
  19931 }
  19932 #else
  19933 __ai __attribute__((target("neon"))) int16x4_t vmul_n_s16(int16x4_t __p0, int16_t __p1) {
  19934   int16x4_t __ret;
  19935   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  19936   __ret = __rev0 * (int16x4_t) {__p1, __p1, __p1, __p1};
  19937   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  19938   return __ret;
  19939 }
  19940 #endif
  19941 
  19942 #ifdef __LITTLE_ENDIAN__
  19943 __ai __attribute__((target("neon"))) poly16x8_t vmull_p8(poly8x8_t __p0, poly8x8_t __p1) {
  19944   poly16x8_t __ret;
  19945   __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 37);
  19946   return __ret;
  19947 }
  19948 #else
  19949 __ai __attribute__((target("neon"))) poly16x8_t vmull_p8(poly8x8_t __p0, poly8x8_t __p1) {
  19950   poly16x8_t __ret;
  19951   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19952   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19953   __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 37);
  19954   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19955   return __ret;
  19956 }
  19957 __ai __attribute__((target("neon"))) poly16x8_t __noswap_vmull_p8(poly8x8_t __p0, poly8x8_t __p1) {
  19958   poly16x8_t __ret;
  19959   __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 37);
  19960   return __ret;
  19961 }
  19962 #endif
  19963 
  19964 #ifdef __LITTLE_ENDIAN__
  19965 __ai __attribute__((target("neon"))) uint16x8_t vmull_u8(uint8x8_t __p0, uint8x8_t __p1) {
  19966   uint16x8_t __ret;
  19967   __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 49);
  19968   return __ret;
  19969 }
  19970 #else
  19971 __ai __attribute__((target("neon"))) uint16x8_t vmull_u8(uint8x8_t __p0, uint8x8_t __p1) {
  19972   uint16x8_t __ret;
  19973   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  19974   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  19975   __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 49);
  19976   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  19977   return __ret;
  19978 }
  19979 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmull_u8(uint8x8_t __p0, uint8x8_t __p1) {
  19980   uint16x8_t __ret;
  19981   __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 49);
  19982   return __ret;
  19983 }
  19984 #endif
  19985 
  19986 #ifdef __LITTLE_ENDIAN__
  19987 __ai __attribute__((target("neon"))) uint64x2_t vmull_u32(uint32x2_t __p0, uint32x2_t __p1) {
  19988   uint64x2_t __ret;
  19989   __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 51);
  19990   return __ret;
  19991 }
  19992 #else
  19993 __ai __attribute__((target("neon"))) uint64x2_t vmull_u32(uint32x2_t __p0, uint32x2_t __p1) {
  19994   uint64x2_t __ret;
  19995   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  19996   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  19997   __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 51);
  19998   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  19999   return __ret;
  20000 }
  20001 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmull_u32(uint32x2_t __p0, uint32x2_t __p1) {
  20002   uint64x2_t __ret;
  20003   __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 51);
  20004   return __ret;
  20005 }
  20006 #endif
  20007 
  20008 #ifdef __LITTLE_ENDIAN__
  20009 __ai __attribute__((target("neon"))) uint32x4_t vmull_u16(uint16x4_t __p0, uint16x4_t __p1) {
  20010   uint32x4_t __ret;
  20011   __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 50);
  20012   return __ret;
  20013 }
  20014 #else
  20015 __ai __attribute__((target("neon"))) uint32x4_t vmull_u16(uint16x4_t __p0, uint16x4_t __p1) {
  20016   uint32x4_t __ret;
  20017   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20018   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20019   __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 50);
  20020   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20021   return __ret;
  20022 }
  20023 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmull_u16(uint16x4_t __p0, uint16x4_t __p1) {
  20024   uint32x4_t __ret;
  20025   __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 50);
  20026   return __ret;
  20027 }
  20028 #endif
  20029 
  20030 #ifdef __LITTLE_ENDIAN__
  20031 __ai __attribute__((target("neon"))) int16x8_t vmull_s8(int8x8_t __p0, int8x8_t __p1) {
  20032   int16x8_t __ret;
  20033   __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 33);
  20034   return __ret;
  20035 }
  20036 #else
  20037 __ai __attribute__((target("neon"))) int16x8_t vmull_s8(int8x8_t __p0, int8x8_t __p1) {
  20038   int16x8_t __ret;
  20039   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20040   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20041   __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 33);
  20042   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20043   return __ret;
  20044 }
  20045 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmull_s8(int8x8_t __p0, int8x8_t __p1) {
  20046   int16x8_t __ret;
  20047   __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 33);
  20048   return __ret;
  20049 }
  20050 #endif
  20051 
  20052 #ifdef __LITTLE_ENDIAN__
  20053 __ai __attribute__((target("neon"))) int64x2_t vmull_s32(int32x2_t __p0, int32x2_t __p1) {
  20054   int64x2_t __ret;
  20055   __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35);
  20056   return __ret;
  20057 }
  20058 #else
  20059 __ai __attribute__((target("neon"))) int64x2_t vmull_s32(int32x2_t __p0, int32x2_t __p1) {
  20060   int64x2_t __ret;
  20061   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20062   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20063   __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 35);
  20064   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20065   return __ret;
  20066 }
  20067 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmull_s32(int32x2_t __p0, int32x2_t __p1) {
  20068   int64x2_t __ret;
  20069   __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35);
  20070   return __ret;
  20071 }
  20072 #endif
  20073 
  20074 #ifdef __LITTLE_ENDIAN__
  20075 __ai __attribute__((target("neon"))) int32x4_t vmull_s16(int16x4_t __p0, int16x4_t __p1) {
  20076   int32x4_t __ret;
  20077   __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34);
  20078   return __ret;
  20079 }
  20080 #else
  20081 __ai __attribute__((target("neon"))) int32x4_t vmull_s16(int16x4_t __p0, int16x4_t __p1) {
  20082   int32x4_t __ret;
  20083   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20084   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20085   __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 34);
  20086   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20087   return __ret;
  20088 }
  20089 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmull_s16(int16x4_t __p0, int16x4_t __p1) {
  20090   int32x4_t __ret;
  20091   __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34);
  20092   return __ret;
  20093 }
  20094 #endif
  20095 
  20096 #ifdef __LITTLE_ENDIAN__
  20097 #define vmull_lane_u32(__p0_114, __p1_114, __p2_114) __extension__ ({ \
  20098   uint64x2_t __ret_114; \
  20099   uint32x2_t __s0_114 = __p0_114; \
  20100   uint32x2_t __s1_114 = __p1_114; \
  20101   __ret_114 = vmull_u32(__s0_114, splat_lane_u32(__s1_114, __p2_114)); \
  20102   __ret_114; \
  20103 })
  20104 #else
  20105 #define vmull_lane_u32(__p0_115, __p1_115, __p2_115) __extension__ ({ \
  20106   uint64x2_t __ret_115; \
  20107   uint32x2_t __s0_115 = __p0_115; \
  20108   uint32x2_t __s1_115 = __p1_115; \
  20109   uint32x2_t __rev0_115;  __rev0_115 = __builtin_shufflevector(__s0_115, __s0_115, 1, 0); \
  20110   uint32x2_t __rev1_115;  __rev1_115 = __builtin_shufflevector(__s1_115, __s1_115, 1, 0); \
  20111   __ret_115 = __noswap_vmull_u32(__rev0_115, __noswap_splat_lane_u32(__rev1_115, __p2_115)); \
  20112   __ret_115 = __builtin_shufflevector(__ret_115, __ret_115, 1, 0); \
  20113   __ret_115; \
  20114 })
  20115 #endif
  20116 
  20117 #ifdef __LITTLE_ENDIAN__
  20118 #define vmull_lane_u16(__p0_116, __p1_116, __p2_116) __extension__ ({ \
  20119   uint32x4_t __ret_116; \
  20120   uint16x4_t __s0_116 = __p0_116; \
  20121   uint16x4_t __s1_116 = __p1_116; \
  20122   __ret_116 = vmull_u16(__s0_116, splat_lane_u16(__s1_116, __p2_116)); \
  20123   __ret_116; \
  20124 })
  20125 #else
  20126 #define vmull_lane_u16(__p0_117, __p1_117, __p2_117) __extension__ ({ \
  20127   uint32x4_t __ret_117; \
  20128   uint16x4_t __s0_117 = __p0_117; \
  20129   uint16x4_t __s1_117 = __p1_117; \
  20130   uint16x4_t __rev0_117;  __rev0_117 = __builtin_shufflevector(__s0_117, __s0_117, 3, 2, 1, 0); \
  20131   uint16x4_t __rev1_117;  __rev1_117 = __builtin_shufflevector(__s1_117, __s1_117, 3, 2, 1, 0); \
  20132   __ret_117 = __noswap_vmull_u16(__rev0_117, __noswap_splat_lane_u16(__rev1_117, __p2_117)); \
  20133   __ret_117 = __builtin_shufflevector(__ret_117, __ret_117, 3, 2, 1, 0); \
  20134   __ret_117; \
  20135 })
  20136 #endif
  20137 
  20138 #ifdef __LITTLE_ENDIAN__
  20139 #define vmull_lane_s32(__p0_118, __p1_118, __p2_118) __extension__ ({ \
  20140   int64x2_t __ret_118; \
  20141   int32x2_t __s0_118 = __p0_118; \
  20142   int32x2_t __s1_118 = __p1_118; \
  20143   __ret_118 = vmull_s32(__s0_118, splat_lane_s32(__s1_118, __p2_118)); \
  20144   __ret_118; \
  20145 })
  20146 #else
  20147 #define vmull_lane_s32(__p0_119, __p1_119, __p2_119) __extension__ ({ \
  20148   int64x2_t __ret_119; \
  20149   int32x2_t __s0_119 = __p0_119; \
  20150   int32x2_t __s1_119 = __p1_119; \
  20151   int32x2_t __rev0_119;  __rev0_119 = __builtin_shufflevector(__s0_119, __s0_119, 1, 0); \
  20152   int32x2_t __rev1_119;  __rev1_119 = __builtin_shufflevector(__s1_119, __s1_119, 1, 0); \
  20153   __ret_119 = __noswap_vmull_s32(__rev0_119, __noswap_splat_lane_s32(__rev1_119, __p2_119)); \
  20154   __ret_119 = __builtin_shufflevector(__ret_119, __ret_119, 1, 0); \
  20155   __ret_119; \
  20156 })
  20157 #endif
  20158 
  20159 #ifdef __LITTLE_ENDIAN__
  20160 #define vmull_lane_s16(__p0_120, __p1_120, __p2_120) __extension__ ({ \
  20161   int32x4_t __ret_120; \
  20162   int16x4_t __s0_120 = __p0_120; \
  20163   int16x4_t __s1_120 = __p1_120; \
  20164   __ret_120 = vmull_s16(__s0_120, splat_lane_s16(__s1_120, __p2_120)); \
  20165   __ret_120; \
  20166 })
  20167 #else
  20168 #define vmull_lane_s16(__p0_121, __p1_121, __p2_121) __extension__ ({ \
  20169   int32x4_t __ret_121; \
  20170   int16x4_t __s0_121 = __p0_121; \
  20171   int16x4_t __s1_121 = __p1_121; \
  20172   int16x4_t __rev0_121;  __rev0_121 = __builtin_shufflevector(__s0_121, __s0_121, 3, 2, 1, 0); \
  20173   int16x4_t __rev1_121;  __rev1_121 = __builtin_shufflevector(__s1_121, __s1_121, 3, 2, 1, 0); \
  20174   __ret_121 = __noswap_vmull_s16(__rev0_121, __noswap_splat_lane_s16(__rev1_121, __p2_121)); \
  20175   __ret_121 = __builtin_shufflevector(__ret_121, __ret_121, 3, 2, 1, 0); \
  20176   __ret_121; \
  20177 })
  20178 #endif
  20179 
  20180 #ifdef __LITTLE_ENDIAN__
  20181 __ai __attribute__((target("neon"))) uint64x2_t vmull_n_u32(uint32x2_t __p0, uint32_t __p1) {
  20182   uint64x2_t __ret;
  20183   __ret = vmull_u32(__p0, (uint32x2_t) {__p1, __p1});
  20184   return __ret;
  20185 }
  20186 #else
  20187 __ai __attribute__((target("neon"))) uint64x2_t vmull_n_u32(uint32x2_t __p0, uint32_t __p1) {
  20188   uint64x2_t __ret;
  20189   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20190   __ret = __noswap_vmull_u32(__rev0, (uint32x2_t) {__p1, __p1});
  20191   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20192   return __ret;
  20193 }
  20194 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmull_n_u32(uint32x2_t __p0, uint32_t __p1) {
  20195   uint64x2_t __ret;
  20196   __ret = __noswap_vmull_u32(__p0, (uint32x2_t) {__p1, __p1});
  20197   return __ret;
  20198 }
  20199 #endif
  20200 
  20201 #ifdef __LITTLE_ENDIAN__
  20202 __ai __attribute__((target("neon"))) uint32x4_t vmull_n_u16(uint16x4_t __p0, uint16_t __p1) {
  20203   uint32x4_t __ret;
  20204   __ret = vmull_u16(__p0, (uint16x4_t) {__p1, __p1, __p1, __p1});
  20205   return __ret;
  20206 }
  20207 #else
  20208 __ai __attribute__((target("neon"))) uint32x4_t vmull_n_u16(uint16x4_t __p0, uint16_t __p1) {
  20209   uint32x4_t __ret;
  20210   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20211   __ret = __noswap_vmull_u16(__rev0, (uint16x4_t) {__p1, __p1, __p1, __p1});
  20212   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20213   return __ret;
  20214 }
  20215 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmull_n_u16(uint16x4_t __p0, uint16_t __p1) {
  20216   uint32x4_t __ret;
  20217   __ret = __noswap_vmull_u16(__p0, (uint16x4_t) {__p1, __p1, __p1, __p1});
  20218   return __ret;
  20219 }
  20220 #endif
  20221 
  20222 #ifdef __LITTLE_ENDIAN__
  20223 __ai __attribute__((target("neon"))) int64x2_t vmull_n_s32(int32x2_t __p0, int32_t __p1) {
  20224   int64x2_t __ret;
  20225   __ret = vmull_s32(__p0, (int32x2_t) {__p1, __p1});
  20226   return __ret;
  20227 }
  20228 #else
  20229 __ai __attribute__((target("neon"))) int64x2_t vmull_n_s32(int32x2_t __p0, int32_t __p1) {
  20230   int64x2_t __ret;
  20231   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20232   __ret = __noswap_vmull_s32(__rev0, (int32x2_t) {__p1, __p1});
  20233   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20234   return __ret;
  20235 }
  20236 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmull_n_s32(int32x2_t __p0, int32_t __p1) {
  20237   int64x2_t __ret;
  20238   __ret = __noswap_vmull_s32(__p0, (int32x2_t) {__p1, __p1});
  20239   return __ret;
  20240 }
  20241 #endif
  20242 
  20243 #ifdef __LITTLE_ENDIAN__
  20244 __ai __attribute__((target("neon"))) int32x4_t vmull_n_s16(int16x4_t __p0, int16_t __p1) {
  20245   int32x4_t __ret;
  20246   __ret = vmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  20247   return __ret;
  20248 }
  20249 #else
  20250 __ai __attribute__((target("neon"))) int32x4_t vmull_n_s16(int16x4_t __p0, int16_t __p1) {
  20251   int32x4_t __ret;
  20252   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20253   __ret = __noswap_vmull_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1});
  20254   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20255   return __ret;
  20256 }
  20257 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmull_n_s16(int16x4_t __p0, int16_t __p1) {
  20258   int32x4_t __ret;
  20259   __ret = __noswap_vmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  20260   return __ret;
  20261 }
  20262 #endif
  20263 
  20264 #ifdef __LITTLE_ENDIAN__
  20265 __ai __attribute__((target("neon"))) poly8x8_t vmvn_p8(poly8x8_t __p0) {
  20266   poly8x8_t __ret;
  20267   __ret = ~__p0;
  20268   return __ret;
  20269 }
  20270 #else
  20271 __ai __attribute__((target("neon"))) poly8x8_t vmvn_p8(poly8x8_t __p0) {
  20272   poly8x8_t __ret;
  20273   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20274   __ret = ~__rev0;
  20275   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20276   return __ret;
  20277 }
  20278 #endif
  20279 
  20280 #ifdef __LITTLE_ENDIAN__
  20281 __ai __attribute__((target("neon"))) poly8x16_t vmvnq_p8(poly8x16_t __p0) {
  20282   poly8x16_t __ret;
  20283   __ret = ~__p0;
  20284   return __ret;
  20285 }
  20286 #else
  20287 __ai __attribute__((target("neon"))) poly8x16_t vmvnq_p8(poly8x16_t __p0) {
  20288   poly8x16_t __ret;
  20289   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20290   __ret = ~__rev0;
  20291   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20292   return __ret;
  20293 }
  20294 #endif
  20295 
  20296 #ifdef __LITTLE_ENDIAN__
  20297 __ai __attribute__((target("neon"))) uint8x16_t vmvnq_u8(uint8x16_t __p0) {
  20298   uint8x16_t __ret;
  20299   __ret = ~__p0;
  20300   return __ret;
  20301 }
  20302 #else
  20303 __ai __attribute__((target("neon"))) uint8x16_t vmvnq_u8(uint8x16_t __p0) {
  20304   uint8x16_t __ret;
  20305   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20306   __ret = ~__rev0;
  20307   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20308   return __ret;
  20309 }
  20310 #endif
  20311 
  20312 #ifdef __LITTLE_ENDIAN__
  20313 __ai __attribute__((target("neon"))) uint32x4_t vmvnq_u32(uint32x4_t __p0) {
  20314   uint32x4_t __ret;
  20315   __ret = ~__p0;
  20316   return __ret;
  20317 }
  20318 #else
  20319 __ai __attribute__((target("neon"))) uint32x4_t vmvnq_u32(uint32x4_t __p0) {
  20320   uint32x4_t __ret;
  20321   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20322   __ret = ~__rev0;
  20323   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20324   return __ret;
  20325 }
  20326 #endif
  20327 
  20328 #ifdef __LITTLE_ENDIAN__
  20329 __ai __attribute__((target("neon"))) uint16x8_t vmvnq_u16(uint16x8_t __p0) {
  20330   uint16x8_t __ret;
  20331   __ret = ~__p0;
  20332   return __ret;
  20333 }
  20334 #else
  20335 __ai __attribute__((target("neon"))) uint16x8_t vmvnq_u16(uint16x8_t __p0) {
  20336   uint16x8_t __ret;
  20337   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20338   __ret = ~__rev0;
  20339   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20340   return __ret;
  20341 }
  20342 #endif
  20343 
  20344 #ifdef __LITTLE_ENDIAN__
  20345 __ai __attribute__((target("neon"))) int8x16_t vmvnq_s8(int8x16_t __p0) {
  20346   int8x16_t __ret;
  20347   __ret = ~__p0;
  20348   return __ret;
  20349 }
  20350 #else
  20351 __ai __attribute__((target("neon"))) int8x16_t vmvnq_s8(int8x16_t __p0) {
  20352   int8x16_t __ret;
  20353   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20354   __ret = ~__rev0;
  20355   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20356   return __ret;
  20357 }
  20358 #endif
  20359 
  20360 #ifdef __LITTLE_ENDIAN__
  20361 __ai __attribute__((target("neon"))) int32x4_t vmvnq_s32(int32x4_t __p0) {
  20362   int32x4_t __ret;
  20363   __ret = ~__p0;
  20364   return __ret;
  20365 }
  20366 #else
  20367 __ai __attribute__((target("neon"))) int32x4_t vmvnq_s32(int32x4_t __p0) {
  20368   int32x4_t __ret;
  20369   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20370   __ret = ~__rev0;
  20371   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20372   return __ret;
  20373 }
  20374 #endif
  20375 
  20376 #ifdef __LITTLE_ENDIAN__
  20377 __ai __attribute__((target("neon"))) int16x8_t vmvnq_s16(int16x8_t __p0) {
  20378   int16x8_t __ret;
  20379   __ret = ~__p0;
  20380   return __ret;
  20381 }
  20382 #else
  20383 __ai __attribute__((target("neon"))) int16x8_t vmvnq_s16(int16x8_t __p0) {
  20384   int16x8_t __ret;
  20385   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20386   __ret = ~__rev0;
  20387   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20388   return __ret;
  20389 }
  20390 #endif
  20391 
  20392 #ifdef __LITTLE_ENDIAN__
  20393 __ai __attribute__((target("neon"))) uint8x8_t vmvn_u8(uint8x8_t __p0) {
  20394   uint8x8_t __ret;
  20395   __ret = ~__p0;
  20396   return __ret;
  20397 }
  20398 #else
  20399 __ai __attribute__((target("neon"))) uint8x8_t vmvn_u8(uint8x8_t __p0) {
  20400   uint8x8_t __ret;
  20401   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20402   __ret = ~__rev0;
  20403   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20404   return __ret;
  20405 }
  20406 #endif
  20407 
  20408 #ifdef __LITTLE_ENDIAN__
  20409 __ai __attribute__((target("neon"))) uint32x2_t vmvn_u32(uint32x2_t __p0) {
  20410   uint32x2_t __ret;
  20411   __ret = ~__p0;
  20412   return __ret;
  20413 }
  20414 #else
  20415 __ai __attribute__((target("neon"))) uint32x2_t vmvn_u32(uint32x2_t __p0) {
  20416   uint32x2_t __ret;
  20417   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20418   __ret = ~__rev0;
  20419   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20420   return __ret;
  20421 }
  20422 #endif
  20423 
  20424 #ifdef __LITTLE_ENDIAN__
  20425 __ai __attribute__((target("neon"))) uint16x4_t vmvn_u16(uint16x4_t __p0) {
  20426   uint16x4_t __ret;
  20427   __ret = ~__p0;
  20428   return __ret;
  20429 }
  20430 #else
  20431 __ai __attribute__((target("neon"))) uint16x4_t vmvn_u16(uint16x4_t __p0) {
  20432   uint16x4_t __ret;
  20433   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20434   __ret = ~__rev0;
  20435   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20436   return __ret;
  20437 }
  20438 #endif
  20439 
  20440 #ifdef __LITTLE_ENDIAN__
  20441 __ai __attribute__((target("neon"))) int8x8_t vmvn_s8(int8x8_t __p0) {
  20442   int8x8_t __ret;
  20443   __ret = ~__p0;
  20444   return __ret;
  20445 }
  20446 #else
  20447 __ai __attribute__((target("neon"))) int8x8_t vmvn_s8(int8x8_t __p0) {
  20448   int8x8_t __ret;
  20449   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20450   __ret = ~__rev0;
  20451   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20452   return __ret;
  20453 }
  20454 #endif
  20455 
  20456 #ifdef __LITTLE_ENDIAN__
  20457 __ai __attribute__((target("neon"))) int32x2_t vmvn_s32(int32x2_t __p0) {
  20458   int32x2_t __ret;
  20459   __ret = ~__p0;
  20460   return __ret;
  20461 }
  20462 #else
  20463 __ai __attribute__((target("neon"))) int32x2_t vmvn_s32(int32x2_t __p0) {
  20464   int32x2_t __ret;
  20465   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20466   __ret = ~__rev0;
  20467   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20468   return __ret;
  20469 }
  20470 #endif
  20471 
  20472 #ifdef __LITTLE_ENDIAN__
  20473 __ai __attribute__((target("neon"))) int16x4_t vmvn_s16(int16x4_t __p0) {
  20474   int16x4_t __ret;
  20475   __ret = ~__p0;
  20476   return __ret;
  20477 }
  20478 #else
  20479 __ai __attribute__((target("neon"))) int16x4_t vmvn_s16(int16x4_t __p0) {
  20480   int16x4_t __ret;
  20481   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20482   __ret = ~__rev0;
  20483   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20484   return __ret;
  20485 }
  20486 #endif
  20487 
  20488 #ifdef __LITTLE_ENDIAN__
  20489 __ai __attribute__((target("neon"))) int8x16_t vnegq_s8(int8x16_t __p0) {
  20490   int8x16_t __ret;
  20491   __ret = -__p0;
  20492   return __ret;
  20493 }
  20494 #else
  20495 __ai __attribute__((target("neon"))) int8x16_t vnegq_s8(int8x16_t __p0) {
  20496   int8x16_t __ret;
  20497   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20498   __ret = -__rev0;
  20499   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20500   return __ret;
  20501 }
  20502 #endif
  20503 
  20504 #ifdef __LITTLE_ENDIAN__
  20505 __ai __attribute__((target("neon"))) float32x4_t vnegq_f32(float32x4_t __p0) {
  20506   float32x4_t __ret;
  20507   __ret = -__p0;
  20508   return __ret;
  20509 }
  20510 #else
  20511 __ai __attribute__((target("neon"))) float32x4_t vnegq_f32(float32x4_t __p0) {
  20512   float32x4_t __ret;
  20513   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20514   __ret = -__rev0;
  20515   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20516   return __ret;
  20517 }
  20518 #endif
  20519 
  20520 #ifdef __LITTLE_ENDIAN__
  20521 __ai __attribute__((target("neon"))) int32x4_t vnegq_s32(int32x4_t __p0) {
  20522   int32x4_t __ret;
  20523   __ret = -__p0;
  20524   return __ret;
  20525 }
  20526 #else
  20527 __ai __attribute__((target("neon"))) int32x4_t vnegq_s32(int32x4_t __p0) {
  20528   int32x4_t __ret;
  20529   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20530   __ret = -__rev0;
  20531   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20532   return __ret;
  20533 }
  20534 #endif
  20535 
  20536 #ifdef __LITTLE_ENDIAN__
  20537 __ai __attribute__((target("neon"))) int16x8_t vnegq_s16(int16x8_t __p0) {
  20538   int16x8_t __ret;
  20539   __ret = -__p0;
  20540   return __ret;
  20541 }
  20542 #else
  20543 __ai __attribute__((target("neon"))) int16x8_t vnegq_s16(int16x8_t __p0) {
  20544   int16x8_t __ret;
  20545   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20546   __ret = -__rev0;
  20547   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20548   return __ret;
  20549 }
  20550 #endif
  20551 
  20552 #ifdef __LITTLE_ENDIAN__
  20553 __ai __attribute__((target("neon"))) int8x8_t vneg_s8(int8x8_t __p0) {
  20554   int8x8_t __ret;
  20555   __ret = -__p0;
  20556   return __ret;
  20557 }
  20558 #else
  20559 __ai __attribute__((target("neon"))) int8x8_t vneg_s8(int8x8_t __p0) {
  20560   int8x8_t __ret;
  20561   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20562   __ret = -__rev0;
  20563   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20564   return __ret;
  20565 }
  20566 #endif
  20567 
  20568 #ifdef __LITTLE_ENDIAN__
  20569 __ai __attribute__((target("neon"))) float32x2_t vneg_f32(float32x2_t __p0) {
  20570   float32x2_t __ret;
  20571   __ret = -__p0;
  20572   return __ret;
  20573 }
  20574 #else
  20575 __ai __attribute__((target("neon"))) float32x2_t vneg_f32(float32x2_t __p0) {
  20576   float32x2_t __ret;
  20577   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20578   __ret = -__rev0;
  20579   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20580   return __ret;
  20581 }
  20582 #endif
  20583 
  20584 #ifdef __LITTLE_ENDIAN__
  20585 __ai __attribute__((target("neon"))) int32x2_t vneg_s32(int32x2_t __p0) {
  20586   int32x2_t __ret;
  20587   __ret = -__p0;
  20588   return __ret;
  20589 }
  20590 #else
  20591 __ai __attribute__((target("neon"))) int32x2_t vneg_s32(int32x2_t __p0) {
  20592   int32x2_t __ret;
  20593   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20594   __ret = -__rev0;
  20595   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20596   return __ret;
  20597 }
  20598 #endif
  20599 
  20600 #ifdef __LITTLE_ENDIAN__
  20601 __ai __attribute__((target("neon"))) int16x4_t vneg_s16(int16x4_t __p0) {
  20602   int16x4_t __ret;
  20603   __ret = -__p0;
  20604   return __ret;
  20605 }
  20606 #else
  20607 __ai __attribute__((target("neon"))) int16x4_t vneg_s16(int16x4_t __p0) {
  20608   int16x4_t __ret;
  20609   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20610   __ret = -__rev0;
  20611   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20612   return __ret;
  20613 }
  20614 #endif
  20615 
  20616 #ifdef __LITTLE_ENDIAN__
  20617 __ai __attribute__((target("neon"))) uint8x16_t vornq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  20618   uint8x16_t __ret;
  20619   __ret = __p0 | ~__p1;
  20620   return __ret;
  20621 }
  20622 #else
  20623 __ai __attribute__((target("neon"))) uint8x16_t vornq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  20624   uint8x16_t __ret;
  20625   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20626   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20627   __ret = __rev0 | ~__rev1;
  20628   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20629   return __ret;
  20630 }
  20631 #endif
  20632 
  20633 #ifdef __LITTLE_ENDIAN__
  20634 __ai __attribute__((target("neon"))) uint32x4_t vornq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  20635   uint32x4_t __ret;
  20636   __ret = __p0 | ~__p1;
  20637   return __ret;
  20638 }
  20639 #else
  20640 __ai __attribute__((target("neon"))) uint32x4_t vornq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  20641   uint32x4_t __ret;
  20642   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20643   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20644   __ret = __rev0 | ~__rev1;
  20645   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20646   return __ret;
  20647 }
  20648 #endif
  20649 
  20650 #ifdef __LITTLE_ENDIAN__
  20651 __ai __attribute__((target("neon"))) uint64x2_t vornq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  20652   uint64x2_t __ret;
  20653   __ret = __p0 | ~__p1;
  20654   return __ret;
  20655 }
  20656 #else
  20657 __ai __attribute__((target("neon"))) uint64x2_t vornq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  20658   uint64x2_t __ret;
  20659   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20660   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20661   __ret = __rev0 | ~__rev1;
  20662   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20663   return __ret;
  20664 }
  20665 #endif
  20666 
  20667 #ifdef __LITTLE_ENDIAN__
  20668 __ai __attribute__((target("neon"))) uint16x8_t vornq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  20669   uint16x8_t __ret;
  20670   __ret = __p0 | ~__p1;
  20671   return __ret;
  20672 }
  20673 #else
  20674 __ai __attribute__((target("neon"))) uint16x8_t vornq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  20675   uint16x8_t __ret;
  20676   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20677   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20678   __ret = __rev0 | ~__rev1;
  20679   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20680   return __ret;
  20681 }
  20682 #endif
  20683 
  20684 #ifdef __LITTLE_ENDIAN__
  20685 __ai __attribute__((target("neon"))) int8x16_t vornq_s8(int8x16_t __p0, int8x16_t __p1) {
  20686   int8x16_t __ret;
  20687   __ret = __p0 | ~__p1;
  20688   return __ret;
  20689 }
  20690 #else
  20691 __ai __attribute__((target("neon"))) int8x16_t vornq_s8(int8x16_t __p0, int8x16_t __p1) {
  20692   int8x16_t __ret;
  20693   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20694   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20695   __ret = __rev0 | ~__rev1;
  20696   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20697   return __ret;
  20698 }
  20699 #endif
  20700 
  20701 #ifdef __LITTLE_ENDIAN__
  20702 __ai __attribute__((target("neon"))) int32x4_t vornq_s32(int32x4_t __p0, int32x4_t __p1) {
  20703   int32x4_t __ret;
  20704   __ret = __p0 | ~__p1;
  20705   return __ret;
  20706 }
  20707 #else
  20708 __ai __attribute__((target("neon"))) int32x4_t vornq_s32(int32x4_t __p0, int32x4_t __p1) {
  20709   int32x4_t __ret;
  20710   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20711   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20712   __ret = __rev0 | ~__rev1;
  20713   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20714   return __ret;
  20715 }
  20716 #endif
  20717 
  20718 #ifdef __LITTLE_ENDIAN__
  20719 __ai __attribute__((target("neon"))) int64x2_t vornq_s64(int64x2_t __p0, int64x2_t __p1) {
  20720   int64x2_t __ret;
  20721   __ret = __p0 | ~__p1;
  20722   return __ret;
  20723 }
  20724 #else
  20725 __ai __attribute__((target("neon"))) int64x2_t vornq_s64(int64x2_t __p0, int64x2_t __p1) {
  20726   int64x2_t __ret;
  20727   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20728   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20729   __ret = __rev0 | ~__rev1;
  20730   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20731   return __ret;
  20732 }
  20733 #endif
  20734 
  20735 #ifdef __LITTLE_ENDIAN__
  20736 __ai __attribute__((target("neon"))) int16x8_t vornq_s16(int16x8_t __p0, int16x8_t __p1) {
  20737   int16x8_t __ret;
  20738   __ret = __p0 | ~__p1;
  20739   return __ret;
  20740 }
  20741 #else
  20742 __ai __attribute__((target("neon"))) int16x8_t vornq_s16(int16x8_t __p0, int16x8_t __p1) {
  20743   int16x8_t __ret;
  20744   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20745   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20746   __ret = __rev0 | ~__rev1;
  20747   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20748   return __ret;
  20749 }
  20750 #endif
  20751 
  20752 #ifdef __LITTLE_ENDIAN__
  20753 __ai __attribute__((target("neon"))) uint8x8_t vorn_u8(uint8x8_t __p0, uint8x8_t __p1) {
  20754   uint8x8_t __ret;
  20755   __ret = __p0 | ~__p1;
  20756   return __ret;
  20757 }
  20758 #else
  20759 __ai __attribute__((target("neon"))) uint8x8_t vorn_u8(uint8x8_t __p0, uint8x8_t __p1) {
  20760   uint8x8_t __ret;
  20761   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20762   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20763   __ret = __rev0 | ~__rev1;
  20764   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20765   return __ret;
  20766 }
  20767 #endif
  20768 
  20769 #ifdef __LITTLE_ENDIAN__
  20770 __ai __attribute__((target("neon"))) uint32x2_t vorn_u32(uint32x2_t __p0, uint32x2_t __p1) {
  20771   uint32x2_t __ret;
  20772   __ret = __p0 | ~__p1;
  20773   return __ret;
  20774 }
  20775 #else
  20776 __ai __attribute__((target("neon"))) uint32x2_t vorn_u32(uint32x2_t __p0, uint32x2_t __p1) {
  20777   uint32x2_t __ret;
  20778   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20779   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20780   __ret = __rev0 | ~__rev1;
  20781   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20782   return __ret;
  20783 }
  20784 #endif
  20785 
  20786 __ai __attribute__((target("neon"))) uint64x1_t vorn_u64(uint64x1_t __p0, uint64x1_t __p1) {
  20787   uint64x1_t __ret;
  20788   __ret = __p0 | ~__p1;
  20789   return __ret;
  20790 }
  20791 #ifdef __LITTLE_ENDIAN__
  20792 __ai __attribute__((target("neon"))) uint16x4_t vorn_u16(uint16x4_t __p0, uint16x4_t __p1) {
  20793   uint16x4_t __ret;
  20794   __ret = __p0 | ~__p1;
  20795   return __ret;
  20796 }
  20797 #else
  20798 __ai __attribute__((target("neon"))) uint16x4_t vorn_u16(uint16x4_t __p0, uint16x4_t __p1) {
  20799   uint16x4_t __ret;
  20800   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20801   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20802   __ret = __rev0 | ~__rev1;
  20803   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20804   return __ret;
  20805 }
  20806 #endif
  20807 
  20808 #ifdef __LITTLE_ENDIAN__
  20809 __ai __attribute__((target("neon"))) int8x8_t vorn_s8(int8x8_t __p0, int8x8_t __p1) {
  20810   int8x8_t __ret;
  20811   __ret = __p0 | ~__p1;
  20812   return __ret;
  20813 }
  20814 #else
  20815 __ai __attribute__((target("neon"))) int8x8_t vorn_s8(int8x8_t __p0, int8x8_t __p1) {
  20816   int8x8_t __ret;
  20817   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20818   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20819   __ret = __rev0 | ~__rev1;
  20820   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20821   return __ret;
  20822 }
  20823 #endif
  20824 
  20825 #ifdef __LITTLE_ENDIAN__
  20826 __ai __attribute__((target("neon"))) int32x2_t vorn_s32(int32x2_t __p0, int32x2_t __p1) {
  20827   int32x2_t __ret;
  20828   __ret = __p0 | ~__p1;
  20829   return __ret;
  20830 }
  20831 #else
  20832 __ai __attribute__((target("neon"))) int32x2_t vorn_s32(int32x2_t __p0, int32x2_t __p1) {
  20833   int32x2_t __ret;
  20834   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20835   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20836   __ret = __rev0 | ~__rev1;
  20837   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20838   return __ret;
  20839 }
  20840 #endif
  20841 
  20842 __ai __attribute__((target("neon"))) int64x1_t vorn_s64(int64x1_t __p0, int64x1_t __p1) {
  20843   int64x1_t __ret;
  20844   __ret = __p0 | ~__p1;
  20845   return __ret;
  20846 }
  20847 #ifdef __LITTLE_ENDIAN__
  20848 __ai __attribute__((target("neon"))) int16x4_t vorn_s16(int16x4_t __p0, int16x4_t __p1) {
  20849   int16x4_t __ret;
  20850   __ret = __p0 | ~__p1;
  20851   return __ret;
  20852 }
  20853 #else
  20854 __ai __attribute__((target("neon"))) int16x4_t vorn_s16(int16x4_t __p0, int16x4_t __p1) {
  20855   int16x4_t __ret;
  20856   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20857   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20858   __ret = __rev0 | ~__rev1;
  20859   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20860   return __ret;
  20861 }
  20862 #endif
  20863 
  20864 #ifdef __LITTLE_ENDIAN__
  20865 __ai __attribute__((target("neon"))) uint8x16_t vorrq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  20866   uint8x16_t __ret;
  20867   __ret = __p0 | __p1;
  20868   return __ret;
  20869 }
  20870 #else
  20871 __ai __attribute__((target("neon"))) uint8x16_t vorrq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  20872   uint8x16_t __ret;
  20873   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20874   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20875   __ret = __rev0 | __rev1;
  20876   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20877   return __ret;
  20878 }
  20879 #endif
  20880 
  20881 #ifdef __LITTLE_ENDIAN__
  20882 __ai __attribute__((target("neon"))) uint32x4_t vorrq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  20883   uint32x4_t __ret;
  20884   __ret = __p0 | __p1;
  20885   return __ret;
  20886 }
  20887 #else
  20888 __ai __attribute__((target("neon"))) uint32x4_t vorrq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  20889   uint32x4_t __ret;
  20890   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20891   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20892   __ret = __rev0 | __rev1;
  20893   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20894   return __ret;
  20895 }
  20896 #endif
  20897 
  20898 #ifdef __LITTLE_ENDIAN__
  20899 __ai __attribute__((target("neon"))) uint64x2_t vorrq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  20900   uint64x2_t __ret;
  20901   __ret = __p0 | __p1;
  20902   return __ret;
  20903 }
  20904 #else
  20905 __ai __attribute__((target("neon"))) uint64x2_t vorrq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  20906   uint64x2_t __ret;
  20907   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20908   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20909   __ret = __rev0 | __rev1;
  20910   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20911   return __ret;
  20912 }
  20913 #endif
  20914 
  20915 #ifdef __LITTLE_ENDIAN__
  20916 __ai __attribute__((target("neon"))) uint16x8_t vorrq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  20917   uint16x8_t __ret;
  20918   __ret = __p0 | __p1;
  20919   return __ret;
  20920 }
  20921 #else
  20922 __ai __attribute__((target("neon"))) uint16x8_t vorrq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  20923   uint16x8_t __ret;
  20924   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20925   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20926   __ret = __rev0 | __rev1;
  20927   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20928   return __ret;
  20929 }
  20930 #endif
  20931 
  20932 #ifdef __LITTLE_ENDIAN__
  20933 __ai __attribute__((target("neon"))) int8x16_t vorrq_s8(int8x16_t __p0, int8x16_t __p1) {
  20934   int8x16_t __ret;
  20935   __ret = __p0 | __p1;
  20936   return __ret;
  20937 }
  20938 #else
  20939 __ai __attribute__((target("neon"))) int8x16_t vorrq_s8(int8x16_t __p0, int8x16_t __p1) {
  20940   int8x16_t __ret;
  20941   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20942   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20943   __ret = __rev0 | __rev1;
  20944   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  20945   return __ret;
  20946 }
  20947 #endif
  20948 
  20949 #ifdef __LITTLE_ENDIAN__
  20950 __ai __attribute__((target("neon"))) int32x4_t vorrq_s32(int32x4_t __p0, int32x4_t __p1) {
  20951   int32x4_t __ret;
  20952   __ret = __p0 | __p1;
  20953   return __ret;
  20954 }
  20955 #else
  20956 __ai __attribute__((target("neon"))) int32x4_t vorrq_s32(int32x4_t __p0, int32x4_t __p1) {
  20957   int32x4_t __ret;
  20958   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  20959   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  20960   __ret = __rev0 | __rev1;
  20961   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  20962   return __ret;
  20963 }
  20964 #endif
  20965 
  20966 #ifdef __LITTLE_ENDIAN__
  20967 __ai __attribute__((target("neon"))) int64x2_t vorrq_s64(int64x2_t __p0, int64x2_t __p1) {
  20968   int64x2_t __ret;
  20969   __ret = __p0 | __p1;
  20970   return __ret;
  20971 }
  20972 #else
  20973 __ai __attribute__((target("neon"))) int64x2_t vorrq_s64(int64x2_t __p0, int64x2_t __p1) {
  20974   int64x2_t __ret;
  20975   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  20976   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  20977   __ret = __rev0 | __rev1;
  20978   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  20979   return __ret;
  20980 }
  20981 #endif
  20982 
  20983 #ifdef __LITTLE_ENDIAN__
  20984 __ai __attribute__((target("neon"))) int16x8_t vorrq_s16(int16x8_t __p0, int16x8_t __p1) {
  20985   int16x8_t __ret;
  20986   __ret = __p0 | __p1;
  20987   return __ret;
  20988 }
  20989 #else
  20990 __ai __attribute__((target("neon"))) int16x8_t vorrq_s16(int16x8_t __p0, int16x8_t __p1) {
  20991   int16x8_t __ret;
  20992   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  20993   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  20994   __ret = __rev0 | __rev1;
  20995   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  20996   return __ret;
  20997 }
  20998 #endif
  20999 
  21000 #ifdef __LITTLE_ENDIAN__
  21001 __ai __attribute__((target("neon"))) uint8x8_t vorr_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21002   uint8x8_t __ret;
  21003   __ret = __p0 | __p1;
  21004   return __ret;
  21005 }
  21006 #else
  21007 __ai __attribute__((target("neon"))) uint8x8_t vorr_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21008   uint8x8_t __ret;
  21009   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21010   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21011   __ret = __rev0 | __rev1;
  21012   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21013   return __ret;
  21014 }
  21015 #endif
  21016 
  21017 #ifdef __LITTLE_ENDIAN__
  21018 __ai __attribute__((target("neon"))) uint32x2_t vorr_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21019   uint32x2_t __ret;
  21020   __ret = __p0 | __p1;
  21021   return __ret;
  21022 }
  21023 #else
  21024 __ai __attribute__((target("neon"))) uint32x2_t vorr_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21025   uint32x2_t __ret;
  21026   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21027   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21028   __ret = __rev0 | __rev1;
  21029   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21030   return __ret;
  21031 }
  21032 #endif
  21033 
  21034 __ai __attribute__((target("neon"))) uint64x1_t vorr_u64(uint64x1_t __p0, uint64x1_t __p1) {
  21035   uint64x1_t __ret;
  21036   __ret = __p0 | __p1;
  21037   return __ret;
  21038 }
  21039 #ifdef __LITTLE_ENDIAN__
  21040 __ai __attribute__((target("neon"))) uint16x4_t vorr_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21041   uint16x4_t __ret;
  21042   __ret = __p0 | __p1;
  21043   return __ret;
  21044 }
  21045 #else
  21046 __ai __attribute__((target("neon"))) uint16x4_t vorr_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21047   uint16x4_t __ret;
  21048   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21049   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21050   __ret = __rev0 | __rev1;
  21051   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21052   return __ret;
  21053 }
  21054 #endif
  21055 
  21056 #ifdef __LITTLE_ENDIAN__
  21057 __ai __attribute__((target("neon"))) int8x8_t vorr_s8(int8x8_t __p0, int8x8_t __p1) {
  21058   int8x8_t __ret;
  21059   __ret = __p0 | __p1;
  21060   return __ret;
  21061 }
  21062 #else
  21063 __ai __attribute__((target("neon"))) int8x8_t vorr_s8(int8x8_t __p0, int8x8_t __p1) {
  21064   int8x8_t __ret;
  21065   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21066   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21067   __ret = __rev0 | __rev1;
  21068   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21069   return __ret;
  21070 }
  21071 #endif
  21072 
  21073 #ifdef __LITTLE_ENDIAN__
  21074 __ai __attribute__((target("neon"))) int32x2_t vorr_s32(int32x2_t __p0, int32x2_t __p1) {
  21075   int32x2_t __ret;
  21076   __ret = __p0 | __p1;
  21077   return __ret;
  21078 }
  21079 #else
  21080 __ai __attribute__((target("neon"))) int32x2_t vorr_s32(int32x2_t __p0, int32x2_t __p1) {
  21081   int32x2_t __ret;
  21082   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21083   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21084   __ret = __rev0 | __rev1;
  21085   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21086   return __ret;
  21087 }
  21088 #endif
  21089 
  21090 __ai __attribute__((target("neon"))) int64x1_t vorr_s64(int64x1_t __p0, int64x1_t __p1) {
  21091   int64x1_t __ret;
  21092   __ret = __p0 | __p1;
  21093   return __ret;
  21094 }
  21095 #ifdef __LITTLE_ENDIAN__
  21096 __ai __attribute__((target("neon"))) int16x4_t vorr_s16(int16x4_t __p0, int16x4_t __p1) {
  21097   int16x4_t __ret;
  21098   __ret = __p0 | __p1;
  21099   return __ret;
  21100 }
  21101 #else
  21102 __ai __attribute__((target("neon"))) int16x4_t vorr_s16(int16x4_t __p0, int16x4_t __p1) {
  21103   int16x4_t __ret;
  21104   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21105   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21106   __ret = __rev0 | __rev1;
  21107   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21108   return __ret;
  21109 }
  21110 #endif
  21111 
  21112 #ifdef __LITTLE_ENDIAN__
  21113 __ai __attribute__((target("neon"))) uint16x8_t vpadalq_u8(uint16x8_t __p0, uint8x16_t __p1) {
  21114   uint16x8_t __ret;
  21115   __ret = (uint16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  21116   return __ret;
  21117 }
  21118 #else
  21119 __ai __attribute__((target("neon"))) uint16x8_t vpadalq_u8(uint16x8_t __p0, uint8x16_t __p1) {
  21120   uint16x8_t __ret;
  21121   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21122   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21123   __ret = (uint16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  21124   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21125   return __ret;
  21126 }
  21127 #endif
  21128 
  21129 #ifdef __LITTLE_ENDIAN__
  21130 __ai __attribute__((target("neon"))) uint64x2_t vpadalq_u32(uint64x2_t __p0, uint32x4_t __p1) {
  21131   uint64x2_t __ret;
  21132   __ret = (uint64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  21133   return __ret;
  21134 }
  21135 #else
  21136 __ai __attribute__((target("neon"))) uint64x2_t vpadalq_u32(uint64x2_t __p0, uint32x4_t __p1) {
  21137   uint64x2_t __ret;
  21138   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21139   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21140   __ret = (uint64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  21141   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21142   return __ret;
  21143 }
  21144 #endif
  21145 
  21146 #ifdef __LITTLE_ENDIAN__
  21147 __ai __attribute__((target("neon"))) uint32x4_t vpadalq_u16(uint32x4_t __p0, uint16x8_t __p1) {
  21148   uint32x4_t __ret;
  21149   __ret = (uint32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  21150   return __ret;
  21151 }
  21152 #else
  21153 __ai __attribute__((target("neon"))) uint32x4_t vpadalq_u16(uint32x4_t __p0, uint16x8_t __p1) {
  21154   uint32x4_t __ret;
  21155   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21156   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21157   __ret = (uint32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  21158   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21159   return __ret;
  21160 }
  21161 #endif
  21162 
  21163 #ifdef __LITTLE_ENDIAN__
  21164 __ai __attribute__((target("neon"))) int16x8_t vpadalq_s8(int16x8_t __p0, int8x16_t __p1) {
  21165   int16x8_t __ret;
  21166   __ret = (int16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  21167   return __ret;
  21168 }
  21169 #else
  21170 __ai __attribute__((target("neon"))) int16x8_t vpadalq_s8(int16x8_t __p0, int8x16_t __p1) {
  21171   int16x8_t __ret;
  21172   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21173   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21174   __ret = (int16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  21175   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21176   return __ret;
  21177 }
  21178 #endif
  21179 
  21180 #ifdef __LITTLE_ENDIAN__
  21181 __ai __attribute__((target("neon"))) int64x2_t vpadalq_s32(int64x2_t __p0, int32x4_t __p1) {
  21182   int64x2_t __ret;
  21183   __ret = (int64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  21184   return __ret;
  21185 }
  21186 #else
  21187 __ai __attribute__((target("neon"))) int64x2_t vpadalq_s32(int64x2_t __p0, int32x4_t __p1) {
  21188   int64x2_t __ret;
  21189   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21190   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21191   __ret = (int64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  21192   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21193   return __ret;
  21194 }
  21195 #endif
  21196 
  21197 #ifdef __LITTLE_ENDIAN__
  21198 __ai __attribute__((target("neon"))) int32x4_t vpadalq_s16(int32x4_t __p0, int16x8_t __p1) {
  21199   int32x4_t __ret;
  21200   __ret = (int32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  21201   return __ret;
  21202 }
  21203 #else
  21204 __ai __attribute__((target("neon"))) int32x4_t vpadalq_s16(int32x4_t __p0, int16x8_t __p1) {
  21205   int32x4_t __ret;
  21206   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21207   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21208   __ret = (int32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  21209   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21210   return __ret;
  21211 }
  21212 #endif
  21213 
  21214 #ifdef __LITTLE_ENDIAN__
  21215 __ai __attribute__((target("neon"))) uint16x4_t vpadal_u8(uint16x4_t __p0, uint8x8_t __p1) {
  21216   uint16x4_t __ret;
  21217   __ret = (uint16x4_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  21218   return __ret;
  21219 }
  21220 #else
  21221 __ai __attribute__((target("neon"))) uint16x4_t vpadal_u8(uint16x4_t __p0, uint8x8_t __p1) {
  21222   uint16x4_t __ret;
  21223   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21224   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21225   __ret = (uint16x4_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  21226   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21227   return __ret;
  21228 }
  21229 #endif
  21230 
  21231 #ifdef __LITTLE_ENDIAN__
  21232 __ai __attribute__((target("neon"))) uint64x1_t vpadal_u32(uint64x1_t __p0, uint32x2_t __p1) {
  21233   uint64x1_t __ret;
  21234   __ret = (uint64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  21235   return __ret;
  21236 }
  21237 #else
  21238 __ai __attribute__((target("neon"))) uint64x1_t vpadal_u32(uint64x1_t __p0, uint32x2_t __p1) {
  21239   uint64x1_t __ret;
  21240   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21241   __ret = (uint64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__rev1, 19);
  21242   return __ret;
  21243 }
  21244 #endif
  21245 
  21246 #ifdef __LITTLE_ENDIAN__
  21247 __ai __attribute__((target("neon"))) uint32x2_t vpadal_u16(uint32x2_t __p0, uint16x4_t __p1) {
  21248   uint32x2_t __ret;
  21249   __ret = (uint32x2_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  21250   return __ret;
  21251 }
  21252 #else
  21253 __ai __attribute__((target("neon"))) uint32x2_t vpadal_u16(uint32x2_t __p0, uint16x4_t __p1) {
  21254   uint32x2_t __ret;
  21255   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21256   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21257   __ret = (uint32x2_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  21258   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21259   return __ret;
  21260 }
  21261 #endif
  21262 
  21263 #ifdef __LITTLE_ENDIAN__
  21264 __ai __attribute__((target("neon"))) int16x4_t vpadal_s8(int16x4_t __p0, int8x8_t __p1) {
  21265   int16x4_t __ret;
  21266   __ret = (int16x4_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  21267   return __ret;
  21268 }
  21269 #else
  21270 __ai __attribute__((target("neon"))) int16x4_t vpadal_s8(int16x4_t __p0, int8x8_t __p1) {
  21271   int16x4_t __ret;
  21272   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21273   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21274   __ret = (int16x4_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  21275   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21276   return __ret;
  21277 }
  21278 #endif
  21279 
  21280 #ifdef __LITTLE_ENDIAN__
  21281 __ai __attribute__((target("neon"))) int64x1_t vpadal_s32(int64x1_t __p0, int32x2_t __p1) {
  21282   int64x1_t __ret;
  21283   __ret = (int64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  21284   return __ret;
  21285 }
  21286 #else
  21287 __ai __attribute__((target("neon"))) int64x1_t vpadal_s32(int64x1_t __p0, int32x2_t __p1) {
  21288   int64x1_t __ret;
  21289   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21290   __ret = (int64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__rev1, 3);
  21291   return __ret;
  21292 }
  21293 #endif
  21294 
  21295 #ifdef __LITTLE_ENDIAN__
  21296 __ai __attribute__((target("neon"))) int32x2_t vpadal_s16(int32x2_t __p0, int16x4_t __p1) {
  21297   int32x2_t __ret;
  21298   __ret = (int32x2_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  21299   return __ret;
  21300 }
  21301 #else
  21302 __ai __attribute__((target("neon"))) int32x2_t vpadal_s16(int32x2_t __p0, int16x4_t __p1) {
  21303   int32x2_t __ret;
  21304   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21305   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21306   __ret = (int32x2_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  21307   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21308   return __ret;
  21309 }
  21310 #endif
  21311 
  21312 #ifdef __LITTLE_ENDIAN__
  21313 __ai __attribute__((target("neon"))) uint8x8_t vpadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21314   uint8x8_t __ret;
  21315   __ret = (uint8x8_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  21316   return __ret;
  21317 }
  21318 #else
  21319 __ai __attribute__((target("neon"))) uint8x8_t vpadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21320   uint8x8_t __ret;
  21321   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21322   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21323   __ret = (uint8x8_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  21324   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21325   return __ret;
  21326 }
  21327 #endif
  21328 
  21329 #ifdef __LITTLE_ENDIAN__
  21330 __ai __attribute__((target("neon"))) uint32x2_t vpadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21331   uint32x2_t __ret;
  21332   __ret = (uint32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  21333   return __ret;
  21334 }
  21335 #else
  21336 __ai __attribute__((target("neon"))) uint32x2_t vpadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21337   uint32x2_t __ret;
  21338   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21339   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21340   __ret = (uint32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  21341   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21342   return __ret;
  21343 }
  21344 #endif
  21345 
  21346 #ifdef __LITTLE_ENDIAN__
  21347 __ai __attribute__((target("neon"))) uint16x4_t vpadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21348   uint16x4_t __ret;
  21349   __ret = (uint16x4_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  21350   return __ret;
  21351 }
  21352 #else
  21353 __ai __attribute__((target("neon"))) uint16x4_t vpadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21354   uint16x4_t __ret;
  21355   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21356   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21357   __ret = (uint16x4_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  21358   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21359   return __ret;
  21360 }
  21361 #endif
  21362 
  21363 #ifdef __LITTLE_ENDIAN__
  21364 __ai __attribute__((target("neon"))) int8x8_t vpadd_s8(int8x8_t __p0, int8x8_t __p1) {
  21365   int8x8_t __ret;
  21366   __ret = (int8x8_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  21367   return __ret;
  21368 }
  21369 #else
  21370 __ai __attribute__((target("neon"))) int8x8_t vpadd_s8(int8x8_t __p0, int8x8_t __p1) {
  21371   int8x8_t __ret;
  21372   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21373   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21374   __ret = (int8x8_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  21375   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21376   return __ret;
  21377 }
  21378 #endif
  21379 
  21380 #ifdef __LITTLE_ENDIAN__
  21381 __ai __attribute__((target("neon"))) float32x2_t vpadd_f32(float32x2_t __p0, float32x2_t __p1) {
  21382   float32x2_t __ret;
  21383   __ret = (float32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  21384   return __ret;
  21385 }
  21386 #else
  21387 __ai __attribute__((target("neon"))) float32x2_t vpadd_f32(float32x2_t __p0, float32x2_t __p1) {
  21388   float32x2_t __ret;
  21389   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21390   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21391   __ret = (float32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  21392   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21393   return __ret;
  21394 }
  21395 #endif
  21396 
  21397 #ifdef __LITTLE_ENDIAN__
  21398 __ai __attribute__((target("neon"))) int32x2_t vpadd_s32(int32x2_t __p0, int32x2_t __p1) {
  21399   int32x2_t __ret;
  21400   __ret = (int32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  21401   return __ret;
  21402 }
  21403 #else
  21404 __ai __attribute__((target("neon"))) int32x2_t vpadd_s32(int32x2_t __p0, int32x2_t __p1) {
  21405   int32x2_t __ret;
  21406   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21407   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21408   __ret = (int32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  21409   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21410   return __ret;
  21411 }
  21412 #endif
  21413 
  21414 #ifdef __LITTLE_ENDIAN__
  21415 __ai __attribute__((target("neon"))) int16x4_t vpadd_s16(int16x4_t __p0, int16x4_t __p1) {
  21416   int16x4_t __ret;
  21417   __ret = (int16x4_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  21418   return __ret;
  21419 }
  21420 #else
  21421 __ai __attribute__((target("neon"))) int16x4_t vpadd_s16(int16x4_t __p0, int16x4_t __p1) {
  21422   int16x4_t __ret;
  21423   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21424   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21425   __ret = (int16x4_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  21426   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21427   return __ret;
  21428 }
  21429 #endif
  21430 
  21431 #ifdef __LITTLE_ENDIAN__
  21432 __ai __attribute__((target("neon"))) uint16x8_t vpaddlq_u8(uint8x16_t __p0) {
  21433   uint16x8_t __ret;
  21434   __ret = (uint16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 49);
  21435   return __ret;
  21436 }
  21437 #else
  21438 __ai __attribute__((target("neon"))) uint16x8_t vpaddlq_u8(uint8x16_t __p0) {
  21439   uint16x8_t __ret;
  21440   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21441   __ret = (uint16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 49);
  21442   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21443   return __ret;
  21444 }
  21445 #endif
  21446 
  21447 #ifdef __LITTLE_ENDIAN__
  21448 __ai __attribute__((target("neon"))) uint64x2_t vpaddlq_u32(uint32x4_t __p0) {
  21449   uint64x2_t __ret;
  21450   __ret = (uint64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 51);
  21451   return __ret;
  21452 }
  21453 #else
  21454 __ai __attribute__((target("neon"))) uint64x2_t vpaddlq_u32(uint32x4_t __p0) {
  21455   uint64x2_t __ret;
  21456   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21457   __ret = (uint64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 51);
  21458   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21459   return __ret;
  21460 }
  21461 #endif
  21462 
  21463 #ifdef __LITTLE_ENDIAN__
  21464 __ai __attribute__((target("neon"))) uint32x4_t vpaddlq_u16(uint16x8_t __p0) {
  21465   uint32x4_t __ret;
  21466   __ret = (uint32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 50);
  21467   return __ret;
  21468 }
  21469 #else
  21470 __ai __attribute__((target("neon"))) uint32x4_t vpaddlq_u16(uint16x8_t __p0) {
  21471   uint32x4_t __ret;
  21472   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21473   __ret = (uint32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 50);
  21474   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21475   return __ret;
  21476 }
  21477 #endif
  21478 
  21479 #ifdef __LITTLE_ENDIAN__
  21480 __ai __attribute__((target("neon"))) int16x8_t vpaddlq_s8(int8x16_t __p0) {
  21481   int16x8_t __ret;
  21482   __ret = (int16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 33);
  21483   return __ret;
  21484 }
  21485 #else
  21486 __ai __attribute__((target("neon"))) int16x8_t vpaddlq_s8(int8x16_t __p0) {
  21487   int16x8_t __ret;
  21488   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21489   __ret = (int16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 33);
  21490   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21491   return __ret;
  21492 }
  21493 #endif
  21494 
  21495 #ifdef __LITTLE_ENDIAN__
  21496 __ai __attribute__((target("neon"))) int64x2_t vpaddlq_s32(int32x4_t __p0) {
  21497   int64x2_t __ret;
  21498   __ret = (int64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 35);
  21499   return __ret;
  21500 }
  21501 #else
  21502 __ai __attribute__((target("neon"))) int64x2_t vpaddlq_s32(int32x4_t __p0) {
  21503   int64x2_t __ret;
  21504   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21505   __ret = (int64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 35);
  21506   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21507   return __ret;
  21508 }
  21509 #endif
  21510 
  21511 #ifdef __LITTLE_ENDIAN__
  21512 __ai __attribute__((target("neon"))) int32x4_t vpaddlq_s16(int16x8_t __p0) {
  21513   int32x4_t __ret;
  21514   __ret = (int32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 34);
  21515   return __ret;
  21516 }
  21517 #else
  21518 __ai __attribute__((target("neon"))) int32x4_t vpaddlq_s16(int16x8_t __p0) {
  21519   int32x4_t __ret;
  21520   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21521   __ret = (int32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 34);
  21522   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21523   return __ret;
  21524 }
  21525 #endif
  21526 
  21527 #ifdef __LITTLE_ENDIAN__
  21528 __ai __attribute__((target("neon"))) uint16x4_t vpaddl_u8(uint8x8_t __p0) {
  21529   uint16x4_t __ret;
  21530   __ret = (uint16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 17);
  21531   return __ret;
  21532 }
  21533 #else
  21534 __ai __attribute__((target("neon"))) uint16x4_t vpaddl_u8(uint8x8_t __p0) {
  21535   uint16x4_t __ret;
  21536   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21537   __ret = (uint16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 17);
  21538   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21539   return __ret;
  21540 }
  21541 #endif
  21542 
  21543 #ifdef __LITTLE_ENDIAN__
  21544 __ai __attribute__((target("neon"))) uint64x1_t vpaddl_u32(uint32x2_t __p0) {
  21545   uint64x1_t __ret;
  21546   __ret = (uint64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 19);
  21547   return __ret;
  21548 }
  21549 #else
  21550 __ai __attribute__((target("neon"))) uint64x1_t vpaddl_u32(uint32x2_t __p0) {
  21551   uint64x1_t __ret;
  21552   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21553   __ret = (uint64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 19);
  21554   return __ret;
  21555 }
  21556 #endif
  21557 
  21558 #ifdef __LITTLE_ENDIAN__
  21559 __ai __attribute__((target("neon"))) uint32x2_t vpaddl_u16(uint16x4_t __p0) {
  21560   uint32x2_t __ret;
  21561   __ret = (uint32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 18);
  21562   return __ret;
  21563 }
  21564 #else
  21565 __ai __attribute__((target("neon"))) uint32x2_t vpaddl_u16(uint16x4_t __p0) {
  21566   uint32x2_t __ret;
  21567   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21568   __ret = (uint32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 18);
  21569   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21570   return __ret;
  21571 }
  21572 #endif
  21573 
  21574 #ifdef __LITTLE_ENDIAN__
  21575 __ai __attribute__((target("neon"))) int16x4_t vpaddl_s8(int8x8_t __p0) {
  21576   int16x4_t __ret;
  21577   __ret = (int16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 1);
  21578   return __ret;
  21579 }
  21580 #else
  21581 __ai __attribute__((target("neon"))) int16x4_t vpaddl_s8(int8x8_t __p0) {
  21582   int16x4_t __ret;
  21583   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21584   __ret = (int16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 1);
  21585   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21586   return __ret;
  21587 }
  21588 #endif
  21589 
  21590 #ifdef __LITTLE_ENDIAN__
  21591 __ai __attribute__((target("neon"))) int64x1_t vpaddl_s32(int32x2_t __p0) {
  21592   int64x1_t __ret;
  21593   __ret = (int64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 3);
  21594   return __ret;
  21595 }
  21596 #else
  21597 __ai __attribute__((target("neon"))) int64x1_t vpaddl_s32(int32x2_t __p0) {
  21598   int64x1_t __ret;
  21599   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21600   __ret = (int64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 3);
  21601   return __ret;
  21602 }
  21603 #endif
  21604 
  21605 #ifdef __LITTLE_ENDIAN__
  21606 __ai __attribute__((target("neon"))) int32x2_t vpaddl_s16(int16x4_t __p0) {
  21607   int32x2_t __ret;
  21608   __ret = (int32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 2);
  21609   return __ret;
  21610 }
  21611 #else
  21612 __ai __attribute__((target("neon"))) int32x2_t vpaddl_s16(int16x4_t __p0) {
  21613   int32x2_t __ret;
  21614   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21615   __ret = (int32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 2);
  21616   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21617   return __ret;
  21618 }
  21619 #endif
  21620 
  21621 #ifdef __LITTLE_ENDIAN__
  21622 __ai __attribute__((target("neon"))) uint8x8_t vpmax_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21623   uint8x8_t __ret;
  21624   __ret = (uint8x8_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  21625   return __ret;
  21626 }
  21627 #else
  21628 __ai __attribute__((target("neon"))) uint8x8_t vpmax_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21629   uint8x8_t __ret;
  21630   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21631   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21632   __ret = (uint8x8_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  21633   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21634   return __ret;
  21635 }
  21636 #endif
  21637 
  21638 #ifdef __LITTLE_ENDIAN__
  21639 __ai __attribute__((target("neon"))) uint32x2_t vpmax_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21640   uint32x2_t __ret;
  21641   __ret = (uint32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  21642   return __ret;
  21643 }
  21644 #else
  21645 __ai __attribute__((target("neon"))) uint32x2_t vpmax_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21646   uint32x2_t __ret;
  21647   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21648   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21649   __ret = (uint32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  21650   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21651   return __ret;
  21652 }
  21653 #endif
  21654 
  21655 #ifdef __LITTLE_ENDIAN__
        /* vpmax_u16 (ACLE pairwise maximum, per naming): forwards both operands
         * to __builtin_neon_vpmax_v as int8x8_t; result is cast to uint16x4_t.
         * The constant 17 is presumably the element-type selector -- TODO confirm. */
  21656 __ai __attribute__((target("neon"))) uint16x4_t vpmax_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21657   uint16x4_t __ret;
  21658   __ret = (uint16x4_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  21659   return __ret;
  21660 }
  21661 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21662 __ai __attribute__((target("neon"))) uint16x4_t vpmax_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21663   uint16x4_t __ret;
  21664   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21665   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21666   __ret = (uint16x4_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  21667   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21668   return __ret;
  21669 }
  21670 #endif
  21671 
  21672 #ifdef __LITTLE_ENDIAN__
        /* vpmax_s8 (ACLE pairwise maximum, per naming): forwards both operands
         * to __builtin_neon_vpmax_v. The casts are no-ops here because the
         * operands already are int8x8_t. The constant 0 is presumably the
         * element-type selector -- TODO confirm. */
  21673 __ai __attribute__((target("neon"))) int8x8_t vpmax_s8(int8x8_t __p0, int8x8_t __p1) {
  21674   int8x8_t __ret;
  21675   __ret = (int8x8_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  21676   return __ret;
  21677 }
  21678 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21679 __ai __attribute__((target("neon"))) int8x8_t vpmax_s8(int8x8_t __p0, int8x8_t __p1) {
  21680   int8x8_t __ret;
  21681   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21682   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21683   __ret = (int8x8_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  21684   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21685   return __ret;
  21686 }
  21687 #endif
  21688 
  21689 #ifdef __LITTLE_ENDIAN__
        /* vpmax_f32 (ACLE pairwise maximum, per naming): forwards both operands
         * to __builtin_neon_vpmax_v as int8x8_t; result is cast to float32x2_t.
         * The constant 9 is presumably the element-type selector -- TODO confirm.
         * NaN handling is decided inside the builtin and is not visible here. */
  21690 __ai __attribute__((target("neon"))) float32x2_t vpmax_f32(float32x2_t __p0, float32x2_t __p1) {
  21691   float32x2_t __ret;
  21692   __ret = (float32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  21693   return __ret;
  21694 }
  21695 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21696 __ai __attribute__((target("neon"))) float32x2_t vpmax_f32(float32x2_t __p0, float32x2_t __p1) {
  21697   float32x2_t __ret;
  21698   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21699   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21700   __ret = (float32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  21701   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21702   return __ret;
  21703 }
  21704 #endif
  21705 
  21706 #ifdef __LITTLE_ENDIAN__
        /* vpmax_s32 (ACLE pairwise maximum, per naming): forwards both operands
         * to __builtin_neon_vpmax_v as int8x8_t; result is cast to int32x2_t.
         * The constant 2 is presumably the element-type selector -- TODO confirm. */
  21707 __ai __attribute__((target("neon"))) int32x2_t vpmax_s32(int32x2_t __p0, int32x2_t __p1) {
  21708   int32x2_t __ret;
  21709   __ret = (int32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  21710   return __ret;
  21711 }
  21712 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21713 __ai __attribute__((target("neon"))) int32x2_t vpmax_s32(int32x2_t __p0, int32x2_t __p1) {
  21714   int32x2_t __ret;
  21715   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21716   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21717   __ret = (int32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  21718   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21719   return __ret;
  21720 }
  21721 #endif
  21722 
  21723 #ifdef __LITTLE_ENDIAN__
        /* vpmax_s16 (ACLE pairwise maximum, per naming): forwards both operands
         * to __builtin_neon_vpmax_v as int8x8_t; result is cast to int16x4_t.
         * The constant 1 is presumably the element-type selector -- TODO confirm. */
  21724 __ai __attribute__((target("neon"))) int16x4_t vpmax_s16(int16x4_t __p0, int16x4_t __p1) {
  21725   int16x4_t __ret;
  21726   __ret = (int16x4_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  21727   return __ret;
  21728 }
  21729 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21730 __ai __attribute__((target("neon"))) int16x4_t vpmax_s16(int16x4_t __p0, int16x4_t __p1) {
  21731   int16x4_t __ret;
  21732   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21733   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21734   __ret = (int16x4_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  21735   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21736   return __ret;
  21737 }
  21738 #endif
  21739 
  21740 #ifdef __LITTLE_ENDIAN__
        /* vpmin_u8 (ACLE pairwise minimum, per naming): hands both operands to
         * __builtin_neon_vpmin_v as int8x8_t and casts the result back to
         * uint8x8_t. The constant 16 is presumably the builtin's element-type
         * selector -- TODO confirm. */
  21741 __ai __attribute__((target("neon"))) uint8x8_t vpmin_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21742   uint8x8_t __ret;
  21743   __ret = (uint8x8_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  21744   return __ret;
  21745 }
  21746 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21747 __ai __attribute__((target("neon"))) uint8x8_t vpmin_u8(uint8x8_t __p0, uint8x8_t __p1) {
  21748   uint8x8_t __ret;
  21749   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21750   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21751   __ret = (uint8x8_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  21752   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21753   return __ret;
  21754 }
  21755 #endif
  21756 
  21757 #ifdef __LITTLE_ENDIAN__
        /* vpmin_u32 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v as int8x8_t; result is cast to uint32x2_t.
         * The constant 18 is presumably the element-type selector -- TODO confirm. */
  21758 __ai __attribute__((target("neon"))) uint32x2_t vpmin_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21759   uint32x2_t __ret;
  21760   __ret = (uint32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  21761   return __ret;
  21762 }
  21763 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21764 __ai __attribute__((target("neon"))) uint32x2_t vpmin_u32(uint32x2_t __p0, uint32x2_t __p1) {
  21765   uint32x2_t __ret;
  21766   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21767   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21768   __ret = (uint32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  21769   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21770   return __ret;
  21771 }
  21772 #endif
  21773 
  21774 #ifdef __LITTLE_ENDIAN__
        /* vpmin_u16 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v as int8x8_t; result is cast to uint16x4_t.
         * The constant 17 is presumably the element-type selector -- TODO confirm. */
  21775 __ai __attribute__((target("neon"))) uint16x4_t vpmin_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21776   uint16x4_t __ret;
  21777   __ret = (uint16x4_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  21778   return __ret;
  21779 }
  21780 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21781 __ai __attribute__((target("neon"))) uint16x4_t vpmin_u16(uint16x4_t __p0, uint16x4_t __p1) {
  21782   uint16x4_t __ret;
  21783   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21784   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21785   __ret = (uint16x4_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  21786   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21787   return __ret;
  21788 }
  21789 #endif
  21790 
  21791 #ifdef __LITTLE_ENDIAN__
        /* vpmin_s8 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v. The casts are no-ops here because the
         * operands already are int8x8_t. The constant 0 is presumably the
         * element-type selector -- TODO confirm. */
  21792 __ai __attribute__((target("neon"))) int8x8_t vpmin_s8(int8x8_t __p0, int8x8_t __p1) {
  21793   int8x8_t __ret;
  21794   __ret = (int8x8_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  21795   return __ret;
  21796 }
  21797 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21798 __ai __attribute__((target("neon"))) int8x8_t vpmin_s8(int8x8_t __p0, int8x8_t __p1) {
  21799   int8x8_t __ret;
  21800   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21801   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  21802   __ret = (int8x8_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  21803   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21804   return __ret;
  21805 }
  21806 #endif
  21807 
  21808 #ifdef __LITTLE_ENDIAN__
        /* vpmin_f32 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v as int8x8_t; result is cast to float32x2_t.
         * The constant 9 is presumably the element-type selector -- TODO confirm.
         * NaN handling is decided inside the builtin and is not visible here. */
  21809 __ai __attribute__((target("neon"))) float32x2_t vpmin_f32(float32x2_t __p0, float32x2_t __p1) {
  21810   float32x2_t __ret;
  21811   __ret = (float32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  21812   return __ret;
  21813 }
  21814 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21815 __ai __attribute__((target("neon"))) float32x2_t vpmin_f32(float32x2_t __p0, float32x2_t __p1) {
  21816   float32x2_t __ret;
  21817   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21818   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21819   __ret = (float32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  21820   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21821   return __ret;
  21822 }
  21823 #endif
  21824 
  21825 #ifdef __LITTLE_ENDIAN__
        /* vpmin_s32 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v as int8x8_t; result is cast to int32x2_t.
         * The constant 2 is presumably the element-type selector -- TODO confirm. */
  21826 __ai __attribute__((target("neon"))) int32x2_t vpmin_s32(int32x2_t __p0, int32x2_t __p1) {
  21827   int32x2_t __ret;
  21828   __ret = (int32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  21829   return __ret;
  21830 }
  21831 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21832 __ai __attribute__((target("neon"))) int32x2_t vpmin_s32(int32x2_t __p0, int32x2_t __p1) {
  21833   int32x2_t __ret;
  21834   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21835   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  21836   __ret = (int32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  21837   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21838   return __ret;
  21839 }
  21840 #endif
  21841 
  21842 #ifdef __LITTLE_ENDIAN__
        /* vpmin_s16 (ACLE pairwise minimum, per naming): forwards both operands
         * to __builtin_neon_vpmin_v as int8x8_t; result is cast to int16x4_t.
         * The constant 1 is presumably the element-type selector -- TODO confirm. */
  21843 __ai __attribute__((target("neon"))) int16x4_t vpmin_s16(int16x4_t __p0, int16x4_t __p1) {
  21844   int16x4_t __ret;
  21845   __ret = (int16x4_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  21846   return __ret;
  21847 }
  21848 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21849 __ai __attribute__((target("neon"))) int16x4_t vpmin_s16(int16x4_t __p0, int16x4_t __p1) {
  21850   int16x4_t __ret;
  21851   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21852   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21853   __ret = (int16x4_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  21854   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21855   return __ret;
  21856 }
  21857 #endif
  21858 
  21859 #ifdef __LITTLE_ENDIAN__
        /* vqabsq_s8 (ACLE saturating absolute value, per naming): passes the
         * single 128-bit operand to __builtin_neon_vqabsq_v. The constant 32 is
         * presumably the builtin's element-type selector -- TODO confirm. */
  21860 __ai __attribute__((target("neon"))) int8x16_t vqabsq_s8(int8x16_t __p0) {
  21861   int8x16_t __ret;
  21862   __ret = (int8x16_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 32);
  21863   return __ret;
  21864 }
  21865 #else
        /* Big-endian variant: reverses the 16 lanes of the operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21866 __ai __attribute__((target("neon"))) int8x16_t vqabsq_s8(int8x16_t __p0) {
  21867   int8x16_t __ret;
  21868   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21869   __ret = (int8x16_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 32);
  21870   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21871   return __ret;
  21872 }
  21873 #endif
  21874 
  21875 #ifdef __LITTLE_ENDIAN__
        /* vqabsq_s32 (ACLE saturating absolute value, per naming): passes the
         * operand to __builtin_neon_vqabsq_v as int8x16_t and casts the result
         * to int32x4_t. The constant 34 is presumably the element-type
         * selector -- TODO confirm. */
  21876 __ai __attribute__((target("neon"))) int32x4_t vqabsq_s32(int32x4_t __p0) {
  21877   int32x4_t __ret;
  21878   __ret = (int32x4_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 34);
  21879   return __ret;
  21880 }
  21881 #else
        /* Big-endian variant: reverses the 4 lanes of the operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21882 __ai __attribute__((target("neon"))) int32x4_t vqabsq_s32(int32x4_t __p0) {
  21883   int32x4_t __ret;
  21884   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21885   __ret = (int32x4_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 34);
  21886   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21887   return __ret;
  21888 }
  21889 #endif
  21890 
  21891 #ifdef __LITTLE_ENDIAN__
        /* vqabsq_s16 (ACLE saturating absolute value, per naming): passes the
         * operand to __builtin_neon_vqabsq_v as int8x16_t and casts the result
         * to int16x8_t. The constant 33 is presumably the element-type
         * selector -- TODO confirm. */
  21892 __ai __attribute__((target("neon"))) int16x8_t vqabsq_s16(int16x8_t __p0) {
  21893   int16x8_t __ret;
  21894   __ret = (int16x8_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 33);
  21895   return __ret;
  21896 }
  21897 #else
        /* Big-endian variant: reverses the 8 lanes of the operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21898 __ai __attribute__((target("neon"))) int16x8_t vqabsq_s16(int16x8_t __p0) {
  21899   int16x8_t __ret;
  21900   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21901   __ret = (int16x8_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 33);
  21902   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21903   return __ret;
  21904 }
  21905 #endif
  21906 
  21907 #ifdef __LITTLE_ENDIAN__
        /* vqabs_s8 (ACLE saturating absolute value, per naming): passes the
         * single 64-bit operand to __builtin_neon_vqabs_v. The constant 0 is
         * presumably the builtin's element-type selector -- TODO confirm. */
  21908 __ai __attribute__((target("neon"))) int8x8_t vqabs_s8(int8x8_t __p0) {
  21909   int8x8_t __ret;
  21910   __ret = (int8x8_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 0);
  21911   return __ret;
  21912 }
  21913 #else
        /* Big-endian variant: reverses the 8 lanes of the operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21914 __ai __attribute__((target("neon"))) int8x8_t vqabs_s8(int8x8_t __p0) {
  21915   int8x8_t __ret;
  21916   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  21917   __ret = (int8x8_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 0);
  21918   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  21919   return __ret;
  21920 }
  21921 #endif
  21922 
  21923 #ifdef __LITTLE_ENDIAN__
        /* vqabs_s32 (ACLE saturating absolute value, per naming): passes the
         * operand to __builtin_neon_vqabs_v as int8x8_t and casts the result to
         * int32x2_t. The constant 2 is presumably the element-type selector --
         * TODO confirm. */
  21924 __ai __attribute__((target("neon"))) int32x2_t vqabs_s32(int32x2_t __p0) {
  21925   int32x2_t __ret;
  21926   __ret = (int32x2_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 2);
  21927   return __ret;
  21928 }
  21929 #else
        /* Big-endian variant: swaps the 2 lanes of the operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21930 __ai __attribute__((target("neon"))) int32x2_t vqabs_s32(int32x2_t __p0) {
  21931   int32x2_t __ret;
  21932   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21933   __ret = (int32x2_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 2);
  21934   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  21935   return __ret;
  21936 }
  21937 #endif
  21938 
  21939 #ifdef __LITTLE_ENDIAN__
        /* vqabs_s16 (ACLE saturating absolute value, per naming): passes the
         * operand to __builtin_neon_vqabs_v as int8x8_t and casts the result to
         * int16x4_t. The constant 1 is presumably the element-type selector --
         * TODO confirm. */
  21940 __ai __attribute__((target("neon"))) int16x4_t vqabs_s16(int16x4_t __p0) {
  21941   int16x4_t __ret;
  21942   __ret = (int16x4_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 1);
  21943   return __ret;
  21944 }
  21945 #else
        /* Big-endian variant: reverses the 4 lanes of the operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21946 __ai __attribute__((target("neon"))) int16x4_t vqabs_s16(int16x4_t __p0) {
  21947   int16x4_t __ret;
  21948   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21949   __ret = (int16x4_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 1);
  21950   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21951   return __ret;
  21952 }
  21953 #endif
  21954 
  21955 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_u8 (ACLE saturating add, per naming): hands both 128-bit
         * operands to __builtin_neon_vqaddq_v as int8x16_t and casts the result
         * back to uint8x16_t. The constant 48 is presumably the builtin's
         * element-type selector -- TODO confirm. */
  21956 __ai __attribute__((target("neon"))) uint8x16_t vqaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  21957   uint8x16_t __ret;
  21958   __ret = (uint8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  21959   return __ret;
  21960 }
  21961 #else
        /* Big-endian variant: reverses the 16 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21962 __ai __attribute__((target("neon"))) uint8x16_t vqaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  21963   uint8x16_t __ret;
  21964   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21965   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21966   __ret = (uint8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  21967   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  21968   return __ret;
  21969 }
  21970 #endif
  21971 
  21972 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_u32 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to uint32x4_t.
         * The constant 50 is presumably the element-type selector -- TODO confirm. */
  21973 __ai __attribute__((target("neon"))) uint32x4_t vqaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  21974   uint32x4_t __ret;
  21975   __ret = (uint32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  21976   return __ret;
  21977 }
  21978 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  21979 __ai __attribute__((target("neon"))) uint32x4_t vqaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  21980   uint32x4_t __ret;
  21981   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  21982   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  21983   __ret = (uint32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  21984   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  21985   return __ret;
  21986 }
  21987 #endif
  21988 
  21989 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_u64 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to uint64x2_t.
         * The constant 51 is presumably the element-type selector -- TODO confirm. */
  21990 __ai __attribute__((target("neon"))) uint64x2_t vqaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  21991   uint64x2_t __ret;
  21992   __ret = (uint64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  21993   return __ret;
  21994 }
  21995 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  21996 __ai __attribute__((target("neon"))) uint64x2_t vqaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  21997   uint64x2_t __ret;
  21998   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  21999   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22000   __ret = (uint64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  22001   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22002   return __ret;
  22003 }
  22004 #endif
  22005 
  22006 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_u16 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to uint16x8_t.
         * The constant 49 is presumably the element-type selector -- TODO confirm. */
  22007 __ai __attribute__((target("neon"))) uint16x8_t vqaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  22008   uint16x8_t __ret;
  22009   __ret = (uint16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  22010   return __ret;
  22011 }
  22012 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22013 __ai __attribute__((target("neon"))) uint16x8_t vqaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  22014   uint16x8_t __ret;
  22015   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22016   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  22017   __ret = (uint16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  22018   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22019   return __ret;
  22020 }
  22021 #endif
  22022 
  22023 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_s8 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v. The casts are no-ops here because the
         * operands already are int8x16_t. The constant 32 is presumably the
         * element-type selector -- TODO confirm. */
  22024 __ai __attribute__((target("neon"))) int8x16_t vqaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  22025   int8x16_t __ret;
  22026   __ret = (int8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  22027   return __ret;
  22028 }
  22029 #else
        /* Big-endian variant: reverses the 16 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22030 __ai __attribute__((target("neon"))) int8x16_t vqaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  22031   int8x16_t __ret;
  22032   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  22033   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  22034   __ret = (int8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  22035   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  22036   return __ret;
  22037 }
  22038 #endif
  22039 
  22040 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_s32 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to int32x4_t.
         * The constant 34 is presumably the element-type selector -- TODO confirm. */
  22041 __ai __attribute__((target("neon"))) int32x4_t vqaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  22042   int32x4_t __ret;
  22043   __ret = (int32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  22044   return __ret;
  22045 }
  22046 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22047 __ai __attribute__((target("neon"))) int32x4_t vqaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  22048   int32x4_t __ret;
  22049   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22050   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22051   __ret = (int32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  22052   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22053   return __ret;
  22054 }
  22055 #endif
  22056 
  22057 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_s64 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to int64x2_t.
         * The constant 35 is presumably the element-type selector -- TODO confirm. */
  22058 __ai __attribute__((target("neon"))) int64x2_t vqaddq_s64(int64x2_t __p0, int64x2_t __p1) {
  22059   int64x2_t __ret;
  22060   __ret = (int64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  22061   return __ret;
  22062 }
  22063 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  22064 __ai __attribute__((target("neon"))) int64x2_t vqaddq_s64(int64x2_t __p0, int64x2_t __p1) {
  22065   int64x2_t __ret;
  22066   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22067   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22068   __ret = (int64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  22069   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22070   return __ret;
  22071 }
  22072 #endif
  22073 
  22074 #ifdef __LITTLE_ENDIAN__
        /* vqaddq_s16 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqaddq_v as int8x16_t; result is cast to int16x8_t.
         * The constant 33 is presumably the element-type selector -- TODO confirm. */
  22075 __ai __attribute__((target("neon"))) int16x8_t vqaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  22076   int16x8_t __ret;
  22077   __ret = (int16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  22078   return __ret;
  22079 }
  22080 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22081 __ai __attribute__((target("neon"))) int16x8_t vqaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  22082   int16x8_t __ret;
  22083   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22084   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  22085   __ret = (int16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  22086   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22087   return __ret;
  22088 }
  22089 #endif
  22090 
  22091 #ifdef __LITTLE_ENDIAN__
        /* vqadd_u8 (ACLE saturating add, per naming): hands both 64-bit operands
         * to __builtin_neon_vqadd_v as int8x8_t and casts the result back to
         * uint8x8_t. The constant 16 is presumably the builtin's element-type
         * selector -- TODO confirm. */
  22092 __ai __attribute__((target("neon"))) uint8x8_t vqadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  22093   uint8x8_t __ret;
  22094   __ret = (uint8x8_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  22095   return __ret;
  22096 }
  22097 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22098 __ai __attribute__((target("neon"))) uint8x8_t vqadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  22099   uint8x8_t __ret;
  22100   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22101   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  22102   __ret = (uint8x8_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  22103   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22104   return __ret;
  22105 }
  22106 #endif
  22107 
  22108 #ifdef __LITTLE_ENDIAN__
        /* vqadd_u32 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqadd_v as int8x8_t; result is cast to uint32x2_t.
         * The constant 18 is presumably the element-type selector -- TODO confirm. */
  22109 __ai __attribute__((target("neon"))) uint32x2_t vqadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  22110   uint32x2_t __ret;
  22111   __ret = (uint32x2_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  22112   return __ret;
  22113 }
  22114 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  22115 __ai __attribute__((target("neon"))) uint32x2_t vqadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  22116   uint32x2_t __ret;
  22117   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22118   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22119   __ret = (uint32x2_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  22120   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22121   return __ret;
  22122 }
  22123 #endif
  22124 
  22125 __ai __attribute__((target("neon"))) uint64x1_t vqadd_u64(uint64x1_t __p0, uint64x1_t __p1) {
          /* ACLE saturating add, per naming. Defined once for both byte orders
           * with no lane shuffle -- presumably because a uint64x1_t has a single
           * lane. The constant 19 is presumably the builtin's element-type
           * selector -- TODO confirm. */
  22126   uint64x1_t __ret;
  22127   __ret = (uint64x1_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  22128   return __ret;
  22129 }
  22130 #ifdef __LITTLE_ENDIAN__
        /* vqadd_u16 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqadd_v as int8x8_t; result is cast to uint16x4_t.
         * The constant 17 is presumably the element-type selector -- TODO confirm. */
  22131 __ai __attribute__((target("neon"))) uint16x4_t vqadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  22132   uint16x4_t __ret;
  22133   __ret = (uint16x4_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  22134   return __ret;
  22135 }
  22136 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22137 __ai __attribute__((target("neon"))) uint16x4_t vqadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  22138   uint16x4_t __ret;
  22139   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22140   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22141   __ret = (uint16x4_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  22142   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22143   return __ret;
  22144 }
  22145 #endif
  22146 
  22147 #ifdef __LITTLE_ENDIAN__
        /* vqadd_s8 (ACLE saturating add, per naming): forwards both operands to
         * __builtin_neon_vqadd_v. The casts are no-ops here because the operands
         * already are int8x8_t. The constant 0 is presumably the element-type
         * selector -- TODO confirm. */
  22148 __ai __attribute__((target("neon"))) int8x8_t vqadd_s8(int8x8_t __p0, int8x8_t __p1) {
  22149   int8x8_t __ret;
  22150   __ret = (int8x8_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  22151   return __ret;
  22152 }
  22153 #else
        /* Big-endian variant: reverses the 8 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22154 __ai __attribute__((target("neon"))) int8x8_t vqadd_s8(int8x8_t __p0, int8x8_t __p1) {
  22155   int8x8_t __ret;
  22156   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22157   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  22158   __ret = (int8x8_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  22159   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22160   return __ret;
  22161 }
  22162 #endif
  22163 
  22164 #ifdef __LITTLE_ENDIAN__
        /* vqadd_s32 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqadd_v as int8x8_t; result is cast to int32x2_t.
         * The constant 2 is presumably the element-type selector -- TODO confirm. */
  22165 __ai __attribute__((target("neon"))) int32x2_t vqadd_s32(int32x2_t __p0, int32x2_t __p1) {
  22166   int32x2_t __ret;
  22167   __ret = (int32x2_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  22168   return __ret;
  22169 }
  22170 #else
        /* Big-endian variant: swaps the 2 lanes of each operand before the
         * builtin call and swaps the lanes of the result afterwards. */
  22171 __ai __attribute__((target("neon"))) int32x2_t vqadd_s32(int32x2_t __p0, int32x2_t __p1) {
  22172   int32x2_t __ret;
  22173   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22174   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22175   __ret = (int32x2_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  22176   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22177   return __ret;
  22178 }
  22179 #endif
  22180 
  22181 __ai __attribute__((target("neon"))) int64x1_t vqadd_s64(int64x1_t __p0, int64x1_t __p1) {
          /* ACLE saturating add, per naming. Defined once for both byte orders
           * with no lane shuffle -- presumably because an int64x1_t has a single
           * lane. The constant 3 is presumably the builtin's element-type
           * selector -- TODO confirm. */
  22182   int64x1_t __ret;
  22183   __ret = (int64x1_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  22184   return __ret;
  22185 }
  22186 #ifdef __LITTLE_ENDIAN__
        /* vqadd_s16 (ACLE saturating add, per naming): forwards both operands
         * to __builtin_neon_vqadd_v as int8x8_t; result is cast to int16x4_t.
         * The constant 1 is presumably the element-type selector -- TODO confirm. */
  22187 __ai __attribute__((target("neon"))) int16x4_t vqadd_s16(int16x4_t __p0, int16x4_t __p1) {
  22188   int16x4_t __ret;
  22189   __ret = (int16x4_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  22190   return __ret;
  22191 }
  22192 #else
        /* Big-endian variant: reverses the 4 lanes of each operand, calls the
         * same builtin, then reverses the lanes of the result. */
  22193 __ai __attribute__((target("neon"))) int16x4_t vqadd_s16(int16x4_t __p0, int16x4_t __p1) {
  22194   int16x4_t __ret;
  22195   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22196   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22197   __ret = (int16x4_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  22198   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22199   return __ret;
  22200 }
  22201 #endif
  22202 
  22203 #ifdef __LITTLE_ENDIAN__
        /* vqdmlal_s32 (ACLE signed saturating doubling multiply-accumulate long,
         * per naming): passes the 128-bit accumulator __p0 as int8x16_t and the
         * two 64-bit operands as int8x8_t to __builtin_neon_vqdmlal_v; result is
         * cast to int64x2_t. The constant 35 is presumably the element-type
         * selector for the result -- TODO confirm. */
  22204 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22205   int64x2_t __ret;
  22206   __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35);
  22207   return __ret;
  22208 }
  22209 #else
        /* Big-endian variant: swaps the 2 lanes of all three operands, calls the
         * same builtin, then swaps the lanes of the result. */
  22210 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22211   int64x2_t __ret;
  22212   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22213   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22214   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  22215   __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 35);
  22216   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22217   return __ret;
  22218 }
        /* Big-endian only: same builtin call with no lane shuffles. Used by other
         * big-endian wrappers in this header (e.g. vqdmlal_lane_s32,
         * vqdmlal_n_s32) that pass operands they have already reversed. */
  22219 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22220   int64x2_t __ret;
  22221   __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35);
  22222   return __ret;
  22223 }
  22224 #endif
  22225 
  22226 #ifdef __LITTLE_ENDIAN__
        /* vqdmlal_s16 (ACLE signed saturating doubling multiply-accumulate long,
         * per naming): passes the 128-bit accumulator __p0 as int8x16_t and the
         * two 64-bit operands as int8x8_t to __builtin_neon_vqdmlal_v; result is
         * cast to int32x4_t. The constant 34 is presumably the element-type
         * selector for the result -- TODO confirm. */
  22227 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22228   int32x4_t __ret;
  22229   __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34);
  22230   return __ret;
  22231 }
  22232 #else
        /* Big-endian variant: reverses the 4 lanes of all three operands, calls
         * the same builtin, then reverses the lanes of the result. */
  22233 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22234   int32x4_t __ret;
  22235   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22236   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22237   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  22238   __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 34);
  22239   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22240   return __ret;
  22241 }
        /* Big-endian only: same builtin call with no lane shuffles. Used by other
         * big-endian wrappers in this header (e.g. vqdmlal_lane_s16,
         * vqdmlal_n_s16) that pass operands they have already reversed. */
  22242 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22243   int32x4_t __ret;
  22244   __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34);
  22245   return __ret;
  22246 }
  22247 #endif
  22248 
  22249 #ifdef __LITTLE_ENDIAN__
        /* vqdmlal_lane_s32(acc, a, v, lane): statement-expression macro. Copies
         * the first three arguments into typed temporaries, broadcasts lane
         * __p3 of the third via splat_lane_s32 (defined elsewhere in this
         * header) and calls vqdmlal_s32 with it. __p3 is forwarded untouched --
         * presumably because the lane index must stay a constant expression
         * (TODO confirm). The numeric suffix on the local names presumably keeps
         * them unique when such macros are nested. */
  22250 #define vqdmlal_lane_s32(__p0_122, __p1_122, __p2_122, __p3_122) __extension__ ({ \
  22251   int64x2_t __ret_122; \
  22252   int64x2_t __s0_122 = __p0_122; \
  22253   int32x2_t __s1_122 = __p1_122; \
  22254   int32x2_t __s2_122 = __p2_122; \
  22255   __ret_122 = vqdmlal_s32(__s0_122, __s1_122, splat_lane_s32(__s2_122, __p3_122)); \
  22256   __ret_122; \
  22257 })
  22258 #else
        /* Big-endian variant: swaps the 2 lanes of each vector temporary, then
         * uses the __noswap_ forms of the splat and of vqdmlal_s32 so no further
         * reversal happens inside them, and finally swaps the lanes of the
         * result. */
  22259 #define vqdmlal_lane_s32(__p0_123, __p1_123, __p2_123, __p3_123) __extension__ ({ \
  22260   int64x2_t __ret_123; \
  22261   int64x2_t __s0_123 = __p0_123; \
  22262   int32x2_t __s1_123 = __p1_123; \
  22263   int32x2_t __s2_123 = __p2_123; \
  22264   int64x2_t __rev0_123;  __rev0_123 = __builtin_shufflevector(__s0_123, __s0_123, 1, 0); \
  22265   int32x2_t __rev1_123;  __rev1_123 = __builtin_shufflevector(__s1_123, __s1_123, 1, 0); \
  22266   int32x2_t __rev2_123;  __rev2_123 = __builtin_shufflevector(__s2_123, __s2_123, 1, 0); \
  22267   __ret_123 = __noswap_vqdmlal_s32(__rev0_123, __rev1_123, __noswap_splat_lane_s32(__rev2_123, __p3_123)); \
  22268   __ret_123 = __builtin_shufflevector(__ret_123, __ret_123, 1, 0); \
  22269   __ret_123; \
  22270 })
  22271 #endif
  22272 
  22273 #ifdef __LITTLE_ENDIAN__
        /* vqdmlal_lane_s16(acc, a, v, lane): statement-expression macro. Copies
         * the first three arguments into typed temporaries, broadcasts lane
         * __p3 of the third via splat_lane_s16 (defined elsewhere in this
         * header) and calls vqdmlal_s16 with it. __p3 is forwarded untouched --
         * presumably because the lane index must stay a constant expression
         * (TODO confirm). The numeric suffix on the local names presumably keeps
         * them unique when such macros are nested. */
  22274 #define vqdmlal_lane_s16(__p0_124, __p1_124, __p2_124, __p3_124) __extension__ ({ \
  22275   int32x4_t __ret_124; \
  22276   int32x4_t __s0_124 = __p0_124; \
  22277   int16x4_t __s1_124 = __p1_124; \
  22278   int16x4_t __s2_124 = __p2_124; \
  22279   __ret_124 = vqdmlal_s16(__s0_124, __s1_124, splat_lane_s16(__s2_124, __p3_124)); \
  22280   __ret_124; \
  22281 })
  22282 #else
        /* Big-endian variant: reverses the 4 lanes of each vector temporary,
         * then uses the __noswap_ forms of the splat and of vqdmlal_s16 so no
         * further reversal happens inside them, and finally reverses the lanes
         * of the result. */
  22283 #define vqdmlal_lane_s16(__p0_125, __p1_125, __p2_125, __p3_125) __extension__ ({ \
  22284   int32x4_t __ret_125; \
  22285   int32x4_t __s0_125 = __p0_125; \
  22286   int16x4_t __s1_125 = __p1_125; \
  22287   int16x4_t __s2_125 = __p2_125; \
  22288   int32x4_t __rev0_125;  __rev0_125 = __builtin_shufflevector(__s0_125, __s0_125, 3, 2, 1, 0); \
  22289   int16x4_t __rev1_125;  __rev1_125 = __builtin_shufflevector(__s1_125, __s1_125, 3, 2, 1, 0); \
  22290   int16x4_t __rev2_125;  __rev2_125 = __builtin_shufflevector(__s2_125, __s2_125, 3, 2, 1, 0); \
  22291   __ret_125 = __noswap_vqdmlal_s16(__rev0_125, __rev1_125, __noswap_splat_lane_s16(__rev2_125, __p3_125)); \
  22292   __ret_125 = __builtin_shufflevector(__ret_125, __ret_125, 3, 2, 1, 0); \
  22293   __ret_125; \
  22294 })
  22295 #endif
  22296 
  22297 #ifdef __LITTLE_ENDIAN__
        /* vqdmlal_n_s32: broadcasts the scalar __p2 into both lanes of an
         * int32x2_t and delegates to vqdmlal_s32(__p0, __p1, <broadcast>). */
  22298 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22299   int64x2_t __ret;
  22300   __ret = vqdmlal_s32(__p0, __p1, (int32x2_t) {__p2, __p2});
  22301   return __ret;
  22302 }
  22303 #else
        /* Big-endian variant: swaps the lanes of __p0 and __p1 only (the
         * broadcast vector has identical lanes, so it is built directly), calls
         * __noswap_vqdmlal_s32, then swaps the lanes of the result. */
  22304 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22305   int64x2_t __ret;
  22306   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22307   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22308   __ret = __noswap_vqdmlal_s32(__rev0, __rev1, (int32x2_t) {__p2, __p2});
  22309   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22310   return __ret;
  22311 }
        /* Big-endian only: broadcast plus __noswap_vqdmlal_s32 with no lane
         * shuffles; presumably for callers whose operands are already reversed
         * (no caller is visible in this part of the header). */
  22312 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22313   int64x2_t __ret;
  22314   __ret = __noswap_vqdmlal_s32(__p0, __p1, (int32x2_t) {__p2, __p2});
  22315   return __ret;
  22316 }
  22317 #endif
  22318 
  22319 #ifdef __LITTLE_ENDIAN__
  22320 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22321   int32x4_t __ret;
  22322   __ret = vqdmlal_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22323   return __ret;
  22324 }
  22325 #else
  22326 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22327   int32x4_t __ret;
  22328   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22329   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22330   __ret = __noswap_vqdmlal_s16(__rev0, __rev1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22331   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22332   return __ret;
  22333 }
  22334 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22335   int32x4_t __ret;
  22336   __ret = __noswap_vqdmlal_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22337   return __ret;
  22338 }
  22339 #endif
  22340 
  22341 #ifdef __LITTLE_ENDIAN__
  22342 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22343   int64x2_t __ret;
  22344   __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35);
  22345   return __ret;
  22346 }
  22347 #else
  22348 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22349   int64x2_t __ret;
  22350   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22351   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22352   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  22353   __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 35);
  22354   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22355   return __ret;
  22356 }
  22357 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  22358   int64x2_t __ret;
  22359   __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35);
  22360   return __ret;
  22361 }
  22362 #endif
  22363 
  22364 #ifdef __LITTLE_ENDIAN__
  22365 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22366   int32x4_t __ret;
  22367   __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34);
  22368   return __ret;
  22369 }
  22370 #else
  22371 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22372   int32x4_t __ret;
  22373   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22374   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22375   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  22376   __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 34);
  22377   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22378   return __ret;
  22379 }
  22380 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  22381   int32x4_t __ret;
  22382   __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34);
  22383   return __ret;
  22384 }
  22385 #endif
  22386 
  22387 #ifdef __LITTLE_ENDIAN__
  22388 #define vqdmlsl_lane_s32(__p0_126, __p1_126, __p2_126, __p3_126) __extension__ ({ \
  22389   int64x2_t __ret_126; \
  22390   int64x2_t __s0_126 = __p0_126; \
  22391   int32x2_t __s1_126 = __p1_126; \
  22392   int32x2_t __s2_126 = __p2_126; \
  22393   __ret_126 = vqdmlsl_s32(__s0_126, __s1_126, splat_lane_s32(__s2_126, __p3_126)); \
  22394   __ret_126; \
  22395 })
  22396 #else
  22397 #define vqdmlsl_lane_s32(__p0_127, __p1_127, __p2_127, __p3_127) __extension__ ({ \
  22398   int64x2_t __ret_127; \
  22399   int64x2_t __s0_127 = __p0_127; \
  22400   int32x2_t __s1_127 = __p1_127; \
  22401   int32x2_t __s2_127 = __p2_127; \
  22402   int64x2_t __rev0_127;  __rev0_127 = __builtin_shufflevector(__s0_127, __s0_127, 1, 0); \
  22403   int32x2_t __rev1_127;  __rev1_127 = __builtin_shufflevector(__s1_127, __s1_127, 1, 0); \
  22404   int32x2_t __rev2_127;  __rev2_127 = __builtin_shufflevector(__s2_127, __s2_127, 1, 0); \
  22405   __ret_127 = __noswap_vqdmlsl_s32(__rev0_127, __rev1_127, __noswap_splat_lane_s32(__rev2_127, __p3_127)); \
  22406   __ret_127 = __builtin_shufflevector(__ret_127, __ret_127, 1, 0); \
  22407   __ret_127; \
  22408 })
  22409 #endif
  22410 
  22411 #ifdef __LITTLE_ENDIAN__
  22412 #define vqdmlsl_lane_s16(__p0_128, __p1_128, __p2_128, __p3_128) __extension__ ({ \
  22413   int32x4_t __ret_128; \
  22414   int32x4_t __s0_128 = __p0_128; \
  22415   int16x4_t __s1_128 = __p1_128; \
  22416   int16x4_t __s2_128 = __p2_128; \
  22417   __ret_128 = vqdmlsl_s16(__s0_128, __s1_128, splat_lane_s16(__s2_128, __p3_128)); \
  22418   __ret_128; \
  22419 })
  22420 #else
  22421 #define vqdmlsl_lane_s16(__p0_129, __p1_129, __p2_129, __p3_129) __extension__ ({ \
  22422   int32x4_t __ret_129; \
  22423   int32x4_t __s0_129 = __p0_129; \
  22424   int16x4_t __s1_129 = __p1_129; \
  22425   int16x4_t __s2_129 = __p2_129; \
  22426   int32x4_t __rev0_129;  __rev0_129 = __builtin_shufflevector(__s0_129, __s0_129, 3, 2, 1, 0); \
  22427   int16x4_t __rev1_129;  __rev1_129 = __builtin_shufflevector(__s1_129, __s1_129, 3, 2, 1, 0); \
  22428   int16x4_t __rev2_129;  __rev2_129 = __builtin_shufflevector(__s2_129, __s2_129, 3, 2, 1, 0); \
  22429   __ret_129 = __noswap_vqdmlsl_s16(__rev0_129, __rev1_129, __noswap_splat_lane_s16(__rev2_129, __p3_129)); \
  22430   __ret_129 = __builtin_shufflevector(__ret_129, __ret_129, 3, 2, 1, 0); \
  22431   __ret_129; \
  22432 })
  22433 #endif
  22434 
  22435 #ifdef __LITTLE_ENDIAN__
  22436 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22437   int64x2_t __ret;
  22438   __ret = vqdmlsl_s32(__p0, __p1, (int32x2_t) {__p2, __p2});
  22439   return __ret;
  22440 }
  22441 #else
  22442 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22443   int64x2_t __ret;
  22444   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22445   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22446   __ret = __noswap_vqdmlsl_s32(__rev0, __rev1, (int32x2_t) {__p2, __p2});
  22447   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22448   return __ret;
  22449 }
  22450 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  22451   int64x2_t __ret;
  22452   __ret = __noswap_vqdmlsl_s32(__p0, __p1, (int32x2_t) {__p2, __p2});
  22453   return __ret;
  22454 }
  22455 #endif
  22456 
  22457 #ifdef __LITTLE_ENDIAN__
  22458 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22459   int32x4_t __ret;
  22460   __ret = vqdmlsl_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22461   return __ret;
  22462 }
  22463 #else
  22464 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22465   int32x4_t __ret;
  22466   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22467   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22468   __ret = __noswap_vqdmlsl_s16(__rev0, __rev1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22469   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22470   return __ret;
  22471 }
  22472 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  22473   int32x4_t __ret;
  22474   __ret = __noswap_vqdmlsl_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  22475   return __ret;
  22476 }
  22477 #endif
  22478 
  22479 #ifdef __LITTLE_ENDIAN__
  22480 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  22481   int32x4_t __ret;
  22482   __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  22483   return __ret;
  22484 }
  22485 #else
  22486 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  22487   int32x4_t __ret;
  22488   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22489   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22490   __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  22491   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22492   return __ret;
  22493 }
  22494 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  22495   int32x4_t __ret;
  22496   __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  22497   return __ret;
  22498 }
  22499 #endif
  22500 
  22501 #ifdef __LITTLE_ENDIAN__
  22502 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  22503   int16x8_t __ret;
  22504   __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  22505   return __ret;
  22506 }
  22507 #else
  22508 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  22509   int16x8_t __ret;
  22510   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22511   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  22512   __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  22513   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22514   return __ret;
  22515 }
  22516 __ai __attribute__((target("neon"))) int16x8_t __noswap_vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  22517   int16x8_t __ret;
  22518   __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  22519   return __ret;
  22520 }
  22521 #endif
  22522 
  22523 #ifdef __LITTLE_ENDIAN__
  22524 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  22525   int32x2_t __ret;
  22526   __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  22527   return __ret;
  22528 }
  22529 #else
  22530 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  22531   int32x2_t __ret;
  22532   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22533   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22534   __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  22535   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22536   return __ret;
  22537 }
  22538 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  22539   int32x2_t __ret;
  22540   __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  22541   return __ret;
  22542 }
  22543 #endif
  22544 
  22545 #ifdef __LITTLE_ENDIAN__
  22546 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  22547   int16x4_t __ret;
  22548   __ret = (int16x4_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  22549   return __ret;
  22550 }
  22551 #else
  22552 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  22553   int16x4_t __ret;
  22554   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22555   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22556   __ret = (int16x4_t) __builtin_neon_vqdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  22557   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22558   return __ret;
  22559 }
  22560 __ai __attribute__((target("neon"))) int16x4_t __noswap_vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  22561   int16x4_t __ret;
  22562   __ret = (int16x4_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  22563   return __ret;
  22564 }
  22565 #endif
  22566 
  22567 #ifdef __LITTLE_ENDIAN__
  22568 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_n_s32(int32x4_t __p0, int32_t __p1) {
  22569   int32x4_t __ret;
  22570   __ret = vqdmulhq_s32(__p0, (int32x4_t) {__p1, __p1, __p1, __p1});
  22571   return __ret;
  22572 }
  22573 #else
  22574 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_n_s32(int32x4_t __p0, int32_t __p1) {
  22575   int32x4_t __ret;
  22576   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22577   __ret = __noswap_vqdmulhq_s32(__rev0, (int32x4_t) {__p1, __p1, __p1, __p1});
  22578   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22579   return __ret;
  22580 }
  22581 #endif
  22582 
  22583 #ifdef __LITTLE_ENDIAN__
  22584 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_n_s16(int16x8_t __p0, int16_t __p1) {
  22585   int16x8_t __ret;
  22586   __ret = vqdmulhq_s16(__p0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1});
  22587   return __ret;
  22588 }
  22589 #else
  22590 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_n_s16(int16x8_t __p0, int16_t __p1) {
  22591   int16x8_t __ret;
  22592   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22593   __ret = __noswap_vqdmulhq_s16(__rev0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1});
  22594   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22595   return __ret;
  22596 }
  22597 #endif
  22598 
  22599 #ifdef __LITTLE_ENDIAN__
  22600 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_n_s32(int32x2_t __p0, int32_t __p1) {
  22601   int32x2_t __ret;
  22602   __ret = vqdmulh_s32(__p0, (int32x2_t) {__p1, __p1});
  22603   return __ret;
  22604 }
  22605 #else
  22606 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_n_s32(int32x2_t __p0, int32_t __p1) {
  22607   int32x2_t __ret;
  22608   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22609   __ret = __noswap_vqdmulh_s32(__rev0, (int32x2_t) {__p1, __p1});
  22610   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22611   return __ret;
  22612 }
  22613 #endif
  22614 
  22615 #ifdef __LITTLE_ENDIAN__
  22616 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_n_s16(int16x4_t __p0, int16_t __p1) {
  22617   int16x4_t __ret;
  22618   __ret = vqdmulh_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  22619   return __ret;
  22620 }
  22621 #else
  22622 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_n_s16(int16x4_t __p0, int16_t __p1) {
  22623   int16x4_t __ret;
  22624   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22625   __ret = __noswap_vqdmulh_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1});
  22626   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22627   return __ret;
  22628 }
  22629 #endif
  22630 
  22631 #ifdef __LITTLE_ENDIAN__
  22632 __ai __attribute__((target("neon"))) int64x2_t vqdmull_s32(int32x2_t __p0, int32x2_t __p1) {
  22633   int64x2_t __ret;
  22634   __ret = (int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35);
  22635   return __ret;
  22636 }
  22637 #else
  22638 __ai __attribute__((target("neon"))) int64x2_t vqdmull_s32(int32x2_t __p0, int32x2_t __p1) {
  22639   int64x2_t __ret;
  22640   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22641   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  22642   __ret = (int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 35);
  22643   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22644   return __ret;
  22645 }
  22646 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmull_s32(int32x2_t __p0, int32x2_t __p1) {
  22647   int64x2_t __ret;
  22648   __ret = (int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35);
  22649   return __ret;
  22650 }
  22651 #endif
  22652 
  22653 #ifdef __LITTLE_ENDIAN__
  22654 __ai __attribute__((target("neon"))) int32x4_t vqdmull_s16(int16x4_t __p0, int16x4_t __p1) {
  22655   int32x4_t __ret;
  22656   __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34);
  22657   return __ret;
  22658 }
  22659 #else
  22660 __ai __attribute__((target("neon"))) int32x4_t vqdmull_s16(int16x4_t __p0, int16x4_t __p1) {
  22661   int32x4_t __ret;
  22662   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22663   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  22664   __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 34);
  22665   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22666   return __ret;
  22667 }
  22668 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmull_s16(int16x4_t __p0, int16x4_t __p1) {
  22669   int32x4_t __ret;
  22670   __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34);
  22671   return __ret;
  22672 }
  22673 #endif
  22674 
  22675 #ifdef __LITTLE_ENDIAN__
  22676 #define vqdmull_lane_s32(__p0_130, __p1_130, __p2_130) __extension__ ({ \
  22677   int64x2_t __ret_130; \
  22678   int32x2_t __s0_130 = __p0_130; \
  22679   int32x2_t __s1_130 = __p1_130; \
  22680   __ret_130 = vqdmull_s32(__s0_130, splat_lane_s32(__s1_130, __p2_130)); \
  22681   __ret_130; \
  22682 })
  22683 #else
  22684 #define vqdmull_lane_s32(__p0_131, __p1_131, __p2_131) __extension__ ({ \
  22685   int64x2_t __ret_131; \
  22686   int32x2_t __s0_131 = __p0_131; \
  22687   int32x2_t __s1_131 = __p1_131; \
  22688   int32x2_t __rev0_131;  __rev0_131 = __builtin_shufflevector(__s0_131, __s0_131, 1, 0); \
  22689   int32x2_t __rev1_131;  __rev1_131 = __builtin_shufflevector(__s1_131, __s1_131, 1, 0); \
  22690   __ret_131 = __noswap_vqdmull_s32(__rev0_131, __noswap_splat_lane_s32(__rev1_131, __p2_131)); \
  22691   __ret_131 = __builtin_shufflevector(__ret_131, __ret_131, 1, 0); \
  22692   __ret_131; \
  22693 })
  22694 #endif
  22695 
  22696 #ifdef __LITTLE_ENDIAN__
  22697 #define vqdmull_lane_s16(__p0_132, __p1_132, __p2_132) __extension__ ({ \
  22698   int32x4_t __ret_132; \
  22699   int16x4_t __s0_132 = __p0_132; \
  22700   int16x4_t __s1_132 = __p1_132; \
  22701   __ret_132 = vqdmull_s16(__s0_132, splat_lane_s16(__s1_132, __p2_132)); \
  22702   __ret_132; \
  22703 })
  22704 #else
  22705 #define vqdmull_lane_s16(__p0_133, __p1_133, __p2_133) __extension__ ({ \
  22706   int32x4_t __ret_133; \
  22707   int16x4_t __s0_133 = __p0_133; \
  22708   int16x4_t __s1_133 = __p1_133; \
  22709   int16x4_t __rev0_133;  __rev0_133 = __builtin_shufflevector(__s0_133, __s0_133, 3, 2, 1, 0); \
  22710   int16x4_t __rev1_133;  __rev1_133 = __builtin_shufflevector(__s1_133, __s1_133, 3, 2, 1, 0); \
  22711   __ret_133 = __noswap_vqdmull_s16(__rev0_133, __noswap_splat_lane_s16(__rev1_133, __p2_133)); \
  22712   __ret_133 = __builtin_shufflevector(__ret_133, __ret_133, 3, 2, 1, 0); \
  22713   __ret_133; \
  22714 })
  22715 #endif
  22716 
  22717 #ifdef __LITTLE_ENDIAN__
  22718 __ai __attribute__((target("neon"))) int64x2_t vqdmull_n_s32(int32x2_t __p0, int32_t __p1) {
  22719   int64x2_t __ret;
  22720   __ret = vqdmull_s32(__p0, (int32x2_t) {__p1, __p1});
  22721   return __ret;
  22722 }
  22723 #else
  22724 __ai __attribute__((target("neon"))) int64x2_t vqdmull_n_s32(int32x2_t __p0, int32_t __p1) {
  22725   int64x2_t __ret;
  22726   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22727   __ret = __noswap_vqdmull_s32(__rev0, (int32x2_t) {__p1, __p1});
  22728   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22729   return __ret;
  22730 }
  22731 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmull_n_s32(int32x2_t __p0, int32_t __p1) {
  22732   int64x2_t __ret;
  22733   __ret = __noswap_vqdmull_s32(__p0, (int32x2_t) {__p1, __p1});
  22734   return __ret;
  22735 }
  22736 #endif
  22737 
  22738 #ifdef __LITTLE_ENDIAN__
  22739 __ai __attribute__((target("neon"))) int32x4_t vqdmull_n_s16(int16x4_t __p0, int16_t __p1) {
  22740   int32x4_t __ret;
  22741   __ret = vqdmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  22742   return __ret;
  22743 }
  22744 #else
  22745 __ai __attribute__((target("neon"))) int32x4_t vqdmull_n_s16(int16x4_t __p0, int16_t __p1) {
  22746   int32x4_t __ret;
  22747   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22748   __ret = __noswap_vqdmull_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1});
  22749   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22750   return __ret;
  22751 }
  22752 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmull_n_s16(int16x4_t __p0, int16_t __p1) {
  22753   int32x4_t __ret;
  22754   __ret = __noswap_vqdmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  22755   return __ret;
  22756 }
  22757 #endif
  22758 
  22759 #ifdef __LITTLE_ENDIAN__
  22760 __ai __attribute__((target("neon"))) uint16x4_t vqmovn_u32(uint32x4_t __p0) {
  22761   uint16x4_t __ret;
  22762   __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 17);
  22763   return __ret;
  22764 }
  22765 #else
  22766 __ai __attribute__((target("neon"))) uint16x4_t vqmovn_u32(uint32x4_t __p0) {
  22767   uint16x4_t __ret;
  22768   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22769   __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 17);
  22770   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22771   return __ret;
  22772 }
  22773 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vqmovn_u32(uint32x4_t __p0) {
  22774   uint16x4_t __ret;
  22775   __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 17);
  22776   return __ret;
  22777 }
  22778 #endif
  22779 
  22780 #ifdef __LITTLE_ENDIAN__
  22781 __ai __attribute__((target("neon"))) uint32x2_t vqmovn_u64(uint64x2_t __p0) {
  22782   uint32x2_t __ret;
  22783   __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 18);
  22784   return __ret;
  22785 }
  22786 #else
  22787 __ai __attribute__((target("neon"))) uint32x2_t vqmovn_u64(uint64x2_t __p0) {
  22788   uint32x2_t __ret;
  22789   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22790   __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 18);
  22791   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22792   return __ret;
  22793 }
  22794 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vqmovn_u64(uint64x2_t __p0) {
  22795   uint32x2_t __ret;
  22796   __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 18);
  22797   return __ret;
  22798 }
  22799 #endif
  22800 
  22801 #ifdef __LITTLE_ENDIAN__
  22802 __ai __attribute__((target("neon"))) uint8x8_t vqmovn_u16(uint16x8_t __p0) {
  22803   uint8x8_t __ret;
  22804   __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 16);
  22805   return __ret;
  22806 }
  22807 #else
  22808 __ai __attribute__((target("neon"))) uint8x8_t vqmovn_u16(uint16x8_t __p0) {
  22809   uint8x8_t __ret;
  22810   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22811   __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 16);
  22812   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22813   return __ret;
  22814 }
  22815 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vqmovn_u16(uint16x8_t __p0) {
  22816   uint8x8_t __ret;
  22817   __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 16);
  22818   return __ret;
  22819 }
  22820 #endif
  22821 
  22822 #ifdef __LITTLE_ENDIAN__
  22823 __ai __attribute__((target("neon"))) int16x4_t vqmovn_s32(int32x4_t __p0) {
  22824   int16x4_t __ret;
  22825   __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 1);
  22826   return __ret;
  22827 }
  22828 #else
  22829 __ai __attribute__((target("neon"))) int16x4_t vqmovn_s32(int32x4_t __p0) {
  22830   int16x4_t __ret;
  22831   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22832   __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 1);
  22833   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22834   return __ret;
  22835 }
  22836 __ai __attribute__((target("neon"))) int16x4_t __noswap_vqmovn_s32(int32x4_t __p0) {
  22837   int16x4_t __ret;
  22838   __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 1);
  22839   return __ret;
  22840 }
  22841 #endif
  22842 
  22843 #ifdef __LITTLE_ENDIAN__
  22844 __ai __attribute__((target("neon"))) int32x2_t vqmovn_s64(int64x2_t __p0) {
  22845   int32x2_t __ret;
  22846   __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 2);
  22847   return __ret;
  22848 }
  22849 #else
  22850 __ai __attribute__((target("neon"))) int32x2_t vqmovn_s64(int64x2_t __p0) {
  22851   int32x2_t __ret;
  22852   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22853   __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 2);
  22854   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22855   return __ret;
  22856 }
  22857 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqmovn_s64(int64x2_t __p0) {
  22858   int32x2_t __ret;
  22859   __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 2);
  22860   return __ret;
  22861 }
  22862 #endif
  22863 
  22864 #ifdef __LITTLE_ENDIAN__
  22865 __ai __attribute__((target("neon"))) int8x8_t vqmovn_s16(int16x8_t __p0) {
  22866   int8x8_t __ret;
  22867   __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 0);
  22868   return __ret;
  22869 }
  22870 #else
  22871 __ai __attribute__((target("neon"))) int8x8_t vqmovn_s16(int16x8_t __p0) {
  22872   int8x8_t __ret;
  22873   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22874   __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 0);
  22875   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22876   return __ret;
  22877 }
  22878 __ai __attribute__((target("neon"))) int8x8_t __noswap_vqmovn_s16(int16x8_t __p0) {
  22879   int8x8_t __ret;
  22880   __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 0);
  22881   return __ret;
  22882 }
  22883 #endif
  22884 
  22885 #ifdef __LITTLE_ENDIAN__
  22886 __ai __attribute__((target("neon"))) uint16x4_t vqmovun_s32(int32x4_t __p0) {
  22887   uint16x4_t __ret;
  22888   __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 17);
  22889   return __ret;
  22890 }
  22891 #else
  22892 __ai __attribute__((target("neon"))) uint16x4_t vqmovun_s32(int32x4_t __p0) {
  22893   uint16x4_t __ret;
  22894   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22895   __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 17);
  22896   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22897   return __ret;
  22898 }
  22899 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vqmovun_s32(int32x4_t __p0) {
  22900   uint16x4_t __ret;
  22901   __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 17);
  22902   return __ret;
  22903 }
  22904 #endif
  22905 
  22906 #ifdef __LITTLE_ENDIAN__
  22907 __ai __attribute__((target("neon"))) uint32x2_t vqmovun_s64(int64x2_t __p0) {
  22908   uint32x2_t __ret;
  22909   __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 18);
  22910   return __ret;
  22911 }
  22912 #else
  22913 __ai __attribute__((target("neon"))) uint32x2_t vqmovun_s64(int64x2_t __p0) {
  22914   uint32x2_t __ret;
  22915   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  22916   __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 18);
  22917   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  22918   return __ret;
  22919 }
  22920 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vqmovun_s64(int64x2_t __p0) {
  22921   uint32x2_t __ret;
  22922   __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 18);
  22923   return __ret;
  22924 }
  22925 #endif
  22926 
  22927 #ifdef __LITTLE_ENDIAN__
  22928 __ai __attribute__((target("neon"))) uint8x8_t vqmovun_s16(int16x8_t __p0) {
  22929   uint8x8_t __ret;
  22930   __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 16);
  22931   return __ret;
  22932 }
  22933 #else
  22934 __ai __attribute__((target("neon"))) uint8x8_t vqmovun_s16(int16x8_t __p0) {
  22935   uint8x8_t __ret;
  22936   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22937   __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 16);
  22938   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22939   return __ret;
  22940 }
  22941 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vqmovun_s16(int16x8_t __p0) {
  22942   uint8x8_t __ret;
  22943   __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 16);
  22944   return __ret;
  22945 }
  22946 #endif
  22947 
  22948 #ifdef __LITTLE_ENDIAN__
  22949 __ai __attribute__((target("neon"))) int8x16_t vqnegq_s8(int8x16_t __p0) {
  22950   int8x16_t __ret;
  22951   __ret = (int8x16_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 32);
  22952   return __ret;
  22953 }
  22954 #else
  22955 __ai __attribute__((target("neon"))) int8x16_t vqnegq_s8(int8x16_t __p0) {
  22956   int8x16_t __ret;
  22957   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  22958   __ret = (int8x16_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 32);
  22959   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  22960   return __ret;
  22961 }
  22962 #endif
  22963 
  22964 #ifdef __LITTLE_ENDIAN__
  22965 __ai __attribute__((target("neon"))) int32x4_t vqnegq_s32(int32x4_t __p0) {
  22966   int32x4_t __ret;
  22967   __ret = (int32x4_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 34);
  22968   return __ret;
  22969 }
  22970 #else
  22971 __ai __attribute__((target("neon"))) int32x4_t vqnegq_s32(int32x4_t __p0) {
  22972   int32x4_t __ret;
  22973   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  22974   __ret = (int32x4_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 34);
  22975   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  22976   return __ret;
  22977 }
  22978 #endif
  22979 
  22980 #ifdef __LITTLE_ENDIAN__
  22981 __ai __attribute__((target("neon"))) int16x8_t vqnegq_s16(int16x8_t __p0) {
  22982   int16x8_t __ret;
  22983   __ret = (int16x8_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 33);
  22984   return __ret;
  22985 }
  22986 #else
  22987 __ai __attribute__((target("neon"))) int16x8_t vqnegq_s16(int16x8_t __p0) {
  22988   int16x8_t __ret;
  22989   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  22990   __ret = (int16x8_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 33);
  22991   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  22992   return __ret;
  22993 }
  22994 #endif
  22995 
  22996 #ifdef __LITTLE_ENDIAN__
  22997 __ai __attribute__((target("neon"))) int8x8_t vqneg_s8(int8x8_t __p0) {
  22998   int8x8_t __ret;
  22999   __ret = (int8x8_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 0);
  23000   return __ret;
  23001 }
  23002 #else
  23003 __ai __attribute__((target("neon"))) int8x8_t vqneg_s8(int8x8_t __p0) {
  23004   int8x8_t __ret;
  23005   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23006   __ret = (int8x8_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 0);
  23007   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23008   return __ret;
  23009 }
  23010 #endif
  23011 
  23012 #ifdef __LITTLE_ENDIAN__
  23013 __ai __attribute__((target("neon"))) int32x2_t vqneg_s32(int32x2_t __p0) {
  23014   int32x2_t __ret;
  23015   __ret = (int32x2_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 2);
  23016   return __ret;
  23017 }
  23018 #else
  23019 __ai __attribute__((target("neon"))) int32x2_t vqneg_s32(int32x2_t __p0) {
  23020   int32x2_t __ret;
  23021   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23022   __ret = (int32x2_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 2);
  23023   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23024   return __ret;
  23025 }
  23026 #endif
  23027 
  23028 #ifdef __LITTLE_ENDIAN__
  23029 __ai __attribute__((target("neon"))) int16x4_t vqneg_s16(int16x4_t __p0) {
  23030   int16x4_t __ret;
  23031   __ret = (int16x4_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 1);
  23032   return __ret;
  23033 }
  23034 #else
  23035 __ai __attribute__((target("neon"))) int16x4_t vqneg_s16(int16x4_t __p0) {
  23036   int16x4_t __ret;
  23037   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23038   __ret = (int16x4_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 1);
  23039   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23040   return __ret;
  23041 }
  23042 #endif
  23043 
  23044 #ifdef __LITTLE_ENDIAN__
  23045 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  23046   int32x4_t __ret;
  23047   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  23048   return __ret;
  23049 }
  23050 #else
  23051 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  23052   int32x4_t __ret;
  23053   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23054   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23055   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  23056   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23057   return __ret;
  23058 }
  23059 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) {
  23060   int32x4_t __ret;
  23061   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  23062   return __ret;
  23063 }
  23064 #endif
  23065 
  23066 #ifdef __LITTLE_ENDIAN__
  23067 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  23068   int16x8_t __ret;
  23069   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  23070   return __ret;
  23071 }
  23072 #else
  23073 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  23074   int16x8_t __ret;
  23075   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23076   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23077   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  23078   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23079   return __ret;
  23080 }
  23081 __ai __attribute__((target("neon"))) int16x8_t __noswap_vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) {
  23082   int16x8_t __ret;
  23083   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  23084   return __ret;
  23085 }
  23086 #endif
  23087 
  23088 #ifdef __LITTLE_ENDIAN__
  23089 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  23090   int32x2_t __ret;
  23091   __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  23092   return __ret;
  23093 }
  23094 #else
  23095 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  23096   int32x2_t __ret;
  23097   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23098   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23099   __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  23100   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23101   return __ret;
  23102 }
  23103 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) {
  23104   int32x2_t __ret;
  23105   __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  23106   return __ret;
  23107 }
  23108 #endif
  23109 
  23110 #ifdef __LITTLE_ENDIAN__
  23111 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  23112   int16x4_t __ret;
  23113   __ret = (int16x4_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  23114   return __ret;
  23115 }
  23116 #else
  23117 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  23118   int16x4_t __ret;
  23119   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23120   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23121   __ret = (int16x4_t) __builtin_neon_vqrdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  23122   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23123   return __ret;
  23124 }
  23125 __ai __attribute__((target("neon"))) int16x4_t __noswap_vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) {
  23126   int16x4_t __ret;
  23127   __ret = (int16x4_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  23128   return __ret;
  23129 }
  23130 #endif
  23131 
  23132 #ifdef __LITTLE_ENDIAN__
  23133 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_n_s32(int32x4_t __p0, int32_t __p1) {
  23134   int32x4_t __ret;
  23135   __ret = vqrdmulhq_s32(__p0, (int32x4_t) {__p1, __p1, __p1, __p1});
  23136   return __ret;
  23137 }
  23138 #else
  23139 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_n_s32(int32x4_t __p0, int32_t __p1) {
  23140   int32x4_t __ret;
  23141   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23142   __ret = __noswap_vqrdmulhq_s32(__rev0, (int32x4_t) {__p1, __p1, __p1, __p1});
  23143   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23144   return __ret;
  23145 }
  23146 #endif
  23147 
  23148 #ifdef __LITTLE_ENDIAN__
  23149 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_n_s16(int16x8_t __p0, int16_t __p1) {
  23150   int16x8_t __ret;
  23151   __ret = vqrdmulhq_s16(__p0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1});
  23152   return __ret;
  23153 }
  23154 #else
  23155 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_n_s16(int16x8_t __p0, int16_t __p1) {
  23156   int16x8_t __ret;
  23157   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23158   __ret = __noswap_vqrdmulhq_s16(__rev0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1});
  23159   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23160   return __ret;
  23161 }
  23162 #endif
  23163 
  23164 #ifdef __LITTLE_ENDIAN__
  23165 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_n_s32(int32x2_t __p0, int32_t __p1) {
  23166   int32x2_t __ret;
  23167   __ret = vqrdmulh_s32(__p0, (int32x2_t) {__p1, __p1});
  23168   return __ret;
  23169 }
  23170 #else
  23171 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_n_s32(int32x2_t __p0, int32_t __p1) {
  23172   int32x2_t __ret;
  23173   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23174   __ret = __noswap_vqrdmulh_s32(__rev0, (int32x2_t) {__p1, __p1});
  23175   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23176   return __ret;
  23177 }
  23178 #endif
  23179 
  23180 #ifdef __LITTLE_ENDIAN__
  23181 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_n_s16(int16x4_t __p0, int16_t __p1) {
  23182   int16x4_t __ret;
  23183   __ret = vqrdmulh_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1});
  23184   return __ret;
  23185 }
  23186 #else
  23187 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_n_s16(int16x4_t __p0, int16_t __p1) {
  23188   int16x4_t __ret;
  23189   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23190   __ret = __noswap_vqrdmulh_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1});
  23191   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23192   return __ret;
  23193 }
  23194 #endif
  23195 
  23196 #ifdef __LITTLE_ENDIAN__
  23197 __ai __attribute__((target("neon"))) uint8x16_t vqrshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  23198   uint8x16_t __ret;
  23199   __ret = (uint8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  23200   return __ret;
  23201 }
  23202 #else
  23203 __ai __attribute__((target("neon"))) uint8x16_t vqrshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  23204   uint8x16_t __ret;
  23205   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23206   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23207   __ret = (uint8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  23208   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23209   return __ret;
  23210 }
  23211 #endif
  23212 
  23213 #ifdef __LITTLE_ENDIAN__
  23214 __ai __attribute__((target("neon"))) uint32x4_t vqrshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  23215   uint32x4_t __ret;
  23216   __ret = (uint32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  23217   return __ret;
  23218 }
  23219 #else
  23220 __ai __attribute__((target("neon"))) uint32x4_t vqrshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  23221   uint32x4_t __ret;
  23222   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23223   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23224   __ret = (uint32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  23225   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23226   return __ret;
  23227 }
  23228 #endif
  23229 
  23230 #ifdef __LITTLE_ENDIAN__
  23231 __ai __attribute__((target("neon"))) uint64x2_t vqrshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  23232   uint64x2_t __ret;
  23233   __ret = (uint64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  23234   return __ret;
  23235 }
  23236 #else
  23237 __ai __attribute__((target("neon"))) uint64x2_t vqrshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  23238   uint64x2_t __ret;
  23239   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23240   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23241   __ret = (uint64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  23242   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23243   return __ret;
  23244 }
  23245 #endif
  23246 
  23247 #ifdef __LITTLE_ENDIAN__
  23248 __ai __attribute__((target("neon"))) uint16x8_t vqrshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  23249   uint16x8_t __ret;
  23250   __ret = (uint16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  23251   return __ret;
  23252 }
  23253 #else
  23254 __ai __attribute__((target("neon"))) uint16x8_t vqrshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  23255   uint16x8_t __ret;
  23256   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23257   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23258   __ret = (uint16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  23259   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23260   return __ret;
  23261 }
  23262 #endif
  23263 
  23264 #ifdef __LITTLE_ENDIAN__
  23265 __ai __attribute__((target("neon"))) int8x16_t vqrshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  23266   int8x16_t __ret;
  23267   __ret = (int8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  23268   return __ret;
  23269 }
  23270 #else
  23271 __ai __attribute__((target("neon"))) int8x16_t vqrshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  23272   int8x16_t __ret;
  23273   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23274   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23275   __ret = (int8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  23276   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23277   return __ret;
  23278 }
  23279 #endif
  23280 
  23281 #ifdef __LITTLE_ENDIAN__
  23282 __ai __attribute__((target("neon"))) int32x4_t vqrshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  23283   int32x4_t __ret;
  23284   __ret = (int32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  23285   return __ret;
  23286 }
  23287 #else
  23288 __ai __attribute__((target("neon"))) int32x4_t vqrshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  23289   int32x4_t __ret;
  23290   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23291   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23292   __ret = (int32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  23293   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23294   return __ret;
  23295 }
  23296 #endif
  23297 
  23298 #ifdef __LITTLE_ENDIAN__
  23299 __ai __attribute__((target("neon"))) int64x2_t vqrshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  23300   int64x2_t __ret;
  23301   __ret = (int64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  23302   return __ret;
  23303 }
  23304 #else
  23305 __ai __attribute__((target("neon"))) int64x2_t vqrshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  23306   int64x2_t __ret;
  23307   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23308   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23309   __ret = (int64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  23310   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23311   return __ret;
  23312 }
  23313 #endif
  23314 
  23315 #ifdef __LITTLE_ENDIAN__
  23316 __ai __attribute__((target("neon"))) int16x8_t vqrshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  23317   int16x8_t __ret;
  23318   __ret = (int16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  23319   return __ret;
  23320 }
  23321 #else
  23322 __ai __attribute__((target("neon"))) int16x8_t vqrshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  23323   int16x8_t __ret;
  23324   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23325   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23326   __ret = (int16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  23327   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23328   return __ret;
  23329 }
  23330 #endif
  23331 
  23332 #ifdef __LITTLE_ENDIAN__
  23333 __ai __attribute__((target("neon"))) uint8x8_t vqrshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  23334   uint8x8_t __ret;
  23335   __ret = (uint8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  23336   return __ret;
  23337 }
  23338 #else
  23339 __ai __attribute__((target("neon"))) uint8x8_t vqrshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  23340   uint8x8_t __ret;
  23341   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23342   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23343   __ret = (uint8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  23344   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23345   return __ret;
  23346 }
  23347 #endif
  23348 
  23349 #ifdef __LITTLE_ENDIAN__
  23350 __ai __attribute__((target("neon"))) uint32x2_t vqrshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  23351   uint32x2_t __ret;
  23352   __ret = (uint32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  23353   return __ret;
  23354 }
  23355 #else
  23356 __ai __attribute__((target("neon"))) uint32x2_t vqrshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  23357   uint32x2_t __ret;
  23358   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23359   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23360   __ret = (uint32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  23361   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23362   return __ret;
  23363 }
  23364 #endif
  23365 
  23366 __ai __attribute__((target("neon"))) uint64x1_t vqrshl_u64(uint64x1_t __p0, int64x1_t __p1) {
  23367   uint64x1_t __ret;
  23368   __ret = (uint64x1_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  23369   return __ret;
  23370 }
  23371 #ifdef __LITTLE_ENDIAN__
  23372 __ai __attribute__((target("neon"))) uint16x4_t vqrshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  23373   uint16x4_t __ret;
  23374   __ret = (uint16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  23375   return __ret;
  23376 }
  23377 #else
  23378 __ai __attribute__((target("neon"))) uint16x4_t vqrshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  23379   uint16x4_t __ret;
  23380   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23381   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23382   __ret = (uint16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  23383   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23384   return __ret;
  23385 }
  23386 #endif
  23387 
  23388 #ifdef __LITTLE_ENDIAN__
  23389 __ai __attribute__((target("neon"))) int8x8_t vqrshl_s8(int8x8_t __p0, int8x8_t __p1) {
  23390   int8x8_t __ret;
  23391   __ret = (int8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  23392   return __ret;
  23393 }
  23394 #else
  23395 __ai __attribute__((target("neon"))) int8x8_t vqrshl_s8(int8x8_t __p0, int8x8_t __p1) {
  23396   int8x8_t __ret;
  23397   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23398   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23399   __ret = (int8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  23400   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23401   return __ret;
  23402 }
  23403 #endif
  23404 
  23405 #ifdef __LITTLE_ENDIAN__
  23406 __ai __attribute__((target("neon"))) int32x2_t vqrshl_s32(int32x2_t __p0, int32x2_t __p1) {
  23407   int32x2_t __ret;
  23408   __ret = (int32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  23409   return __ret;
  23410 }
  23411 #else
  23412 __ai __attribute__((target("neon"))) int32x2_t vqrshl_s32(int32x2_t __p0, int32x2_t __p1) {
  23413   int32x2_t __ret;
  23414   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23415   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23416   __ret = (int32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  23417   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23418   return __ret;
  23419 }
  23420 #endif
  23421 
  23422 __ai __attribute__((target("neon"))) int64x1_t vqrshl_s64(int64x1_t __p0, int64x1_t __p1) {
  23423   int64x1_t __ret;
  23424   __ret = (int64x1_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  23425   return __ret;
  23426 }
  23427 #ifdef __LITTLE_ENDIAN__
  23428 __ai __attribute__((target("neon"))) int16x4_t vqrshl_s16(int16x4_t __p0, int16x4_t __p1) {
  23429   int16x4_t __ret;
  23430   __ret = (int16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  23431   return __ret;
  23432 }
  23433 #else
  23434 __ai __attribute__((target("neon"))) int16x4_t vqrshl_s16(int16x4_t __p0, int16x4_t __p1) {
  23435   int16x4_t __ret;
  23436   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23437   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23438   __ret = (int16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  23439   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23440   return __ret;
  23441 }
  23442 #endif
  23443 
  23444 #ifdef __LITTLE_ENDIAN__
  23445 #define vqrshrn_n_u32(__p0, __p1) __extension__ ({ \
  23446   uint16x4_t __ret; \
  23447   uint32x4_t __s0 = __p0; \
  23448   __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 17); \
  23449   __ret; \
  23450 })
  23451 #else
  23452 #define vqrshrn_n_u32(__p0, __p1) __extension__ ({ \
  23453   uint16x4_t __ret; \
  23454   uint32x4_t __s0 = __p0; \
  23455   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  23456   __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 17); \
  23457   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  23458   __ret; \
  23459 })
  23460 #define __noswap_vqrshrn_n_u32(__p0, __p1) __extension__ ({ \
  23461   uint16x4_t __ret; \
  23462   uint32x4_t __s0 = __p0; \
  23463   __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 17); \
  23464   __ret; \
  23465 })
  23466 #endif
  23467 
  23468 #ifdef __LITTLE_ENDIAN__
  23469 #define vqrshrn_n_u64(__p0, __p1) __extension__ ({ \
  23470   uint32x2_t __ret; \
  23471   uint64x2_t __s0 = __p0; \
  23472   __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 18); \
  23473   __ret; \
  23474 })
  23475 #else
  23476 #define vqrshrn_n_u64(__p0, __p1) __extension__ ({ \
  23477   uint32x2_t __ret; \
  23478   uint64x2_t __s0 = __p0; \
  23479   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  23480   __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 18); \
  23481   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  23482   __ret; \
  23483 })
  23484 #define __noswap_vqrshrn_n_u64(__p0, __p1) __extension__ ({ \
  23485   uint32x2_t __ret; \
  23486   uint64x2_t __s0 = __p0; \
  23487   __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 18); \
  23488   __ret; \
  23489 })
  23490 #endif
  23491 
  23492 #ifdef __LITTLE_ENDIAN__
  23493 #define vqrshrn_n_u16(__p0, __p1) __extension__ ({ \
  23494   uint8x8_t __ret; \
  23495   uint16x8_t __s0 = __p0; \
  23496   __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 16); \
  23497   __ret; \
  23498 })
  23499 #else
  23500 #define vqrshrn_n_u16(__p0, __p1) __extension__ ({ \
  23501   uint8x8_t __ret; \
  23502   uint16x8_t __s0 = __p0; \
  23503   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  23504   __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 16); \
  23505   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  23506   __ret; \
  23507 })
  23508 #define __noswap_vqrshrn_n_u16(__p0, __p1) __extension__ ({ \
  23509   uint8x8_t __ret; \
  23510   uint16x8_t __s0 = __p0; \
  23511   __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 16); \
  23512   __ret; \
  23513 })
  23514 #endif
  23515 
  23516 #ifdef __LITTLE_ENDIAN__
  23517 #define vqrshrn_n_s32(__p0, __p1) __extension__ ({ \
  23518   int16x4_t __ret; \
  23519   int32x4_t __s0 = __p0; \
  23520   __ret = (int16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 1); \
  23521   __ret; \
  23522 })
  23523 #else
  23524 #define vqrshrn_n_s32(__p0, __p1) __extension__ ({ \
  23525   int16x4_t __ret; \
  23526   int32x4_t __s0 = __p0; \
  23527   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  23528   __ret = (int16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 1); \
  23529   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  23530   __ret; \
  23531 })
  23532 #define __noswap_vqrshrn_n_s32(__p0, __p1) __extension__ ({ \
  23533   int16x4_t __ret; \
  23534   int32x4_t __s0 = __p0; \
  23535   __ret = (int16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 1); \
  23536   __ret; \
  23537 })
  23538 #endif
  23539 
  23540 #ifdef __LITTLE_ENDIAN__
  23541 #define vqrshrn_n_s64(__p0, __p1) __extension__ ({ \
  23542   int32x2_t __ret; \
  23543   int64x2_t __s0 = __p0; \
  23544   __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 2); \
  23545   __ret; \
  23546 })
  23547 #else
  23548 #define vqrshrn_n_s64(__p0, __p1) __extension__ ({ \
  23549   int32x2_t __ret; \
  23550   int64x2_t __s0 = __p0; \
  23551   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  23552   __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 2); \
  23553   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  23554   __ret; \
  23555 })
  23556 #define __noswap_vqrshrn_n_s64(__p0, __p1) __extension__ ({ \
  23557   int32x2_t __ret; \
  23558   int64x2_t __s0 = __p0; \
  23559   __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 2); \
  23560   __ret; \
  23561 })
  23562 #endif
  23563 
  23564 #ifdef __LITTLE_ENDIAN__
  23565 #define vqrshrn_n_s16(__p0, __p1) __extension__ ({ \
  23566   int8x8_t __ret; \
  23567   int16x8_t __s0 = __p0; \
  23568   __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 0); \
  23569   __ret; \
  23570 })
  23571 #else
  23572 #define vqrshrn_n_s16(__p0, __p1) __extension__ ({ \
  23573   int8x8_t __ret; \
  23574   int16x8_t __s0 = __p0; \
  23575   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  23576   __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 0); \
  23577   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  23578   __ret; \
  23579 })
  23580 #define __noswap_vqrshrn_n_s16(__p0, __p1) __extension__ ({ \
  23581   int8x8_t __ret; \
  23582   int16x8_t __s0 = __p0; \
  23583   __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 0); \
  23584   __ret; \
  23585 })
  23586 #endif
  23587 
  23588 #ifdef __LITTLE_ENDIAN__
  23589 #define vqrshrun_n_s32(__p0, __p1) __extension__ ({ \
  23590   uint16x4_t __ret; \
  23591   int32x4_t __s0 = __p0; \
  23592   __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 17); \
  23593   __ret; \
  23594 })
  23595 #else
  23596 #define vqrshrun_n_s32(__p0, __p1) __extension__ ({ \
  23597   uint16x4_t __ret; \
  23598   int32x4_t __s0 = __p0; \
  23599   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  23600   __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 17); \
  23601   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  23602   __ret; \
  23603 })
  23604 #define __noswap_vqrshrun_n_s32(__p0, __p1) __extension__ ({ \
  23605   uint16x4_t __ret; \
  23606   int32x4_t __s0 = __p0; \
  23607   __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 17); \
  23608   __ret; \
  23609 })
  23610 #endif
  23611 
  23612 #ifdef __LITTLE_ENDIAN__
  23613 #define vqrshrun_n_s64(__p0, __p1) __extension__ ({ \
  23614   uint32x2_t __ret; \
  23615   int64x2_t __s0 = __p0; \
  23616   __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 18); \
  23617   __ret; \
  23618 })
  23619 #else
  23620 #define vqrshrun_n_s64(__p0, __p1) __extension__ ({ \
  23621   uint32x2_t __ret; \
  23622   int64x2_t __s0 = __p0; \
  23623   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  23624   __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 18); \
  23625   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  23626   __ret; \
  23627 })
  23628 #define __noswap_vqrshrun_n_s64(__p0, __p1) __extension__ ({ \
  23629   uint32x2_t __ret; \
  23630   int64x2_t __s0 = __p0; \
  23631   __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 18); \
  23632   __ret; \
  23633 })
  23634 #endif
  23635 
  23636 #ifdef __LITTLE_ENDIAN__
  23637 #define vqrshrun_n_s16(__p0, __p1) __extension__ ({ \
  23638   uint8x8_t __ret; \
  23639   int16x8_t __s0 = __p0; \
  23640   __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 16); \
  23641   __ret; \
  23642 })
  23643 #else
  23644 #define vqrshrun_n_s16(__p0, __p1) __extension__ ({ \
  23645   uint8x8_t __ret; \
  23646   int16x8_t __s0 = __p0; \
  23647   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  23648   __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 16); \
  23649   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  23650   __ret; \
  23651 })
  23652 #define __noswap_vqrshrun_n_s16(__p0, __p1) __extension__ ({ \
  23653   uint8x8_t __ret; \
  23654   int16x8_t __s0 = __p0; \
  23655   __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 16); \
  23656   __ret; \
  23657 })
  23658 #endif
  23659 
  23660 #ifdef __LITTLE_ENDIAN__
  23661 __ai __attribute__((target("neon"))) uint8x16_t vqshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  23662   uint8x16_t __ret;
  23663   __ret = (uint8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  23664   return __ret;
  23665 }
  23666 #else
  23667 __ai __attribute__((target("neon"))) uint8x16_t vqshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  23668   uint8x16_t __ret;
  23669   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23670   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23671   __ret = (uint8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  23672   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23673   return __ret;
  23674 }
  23675 #endif
  23676 
  23677 #ifdef __LITTLE_ENDIAN__
  23678 __ai __attribute__((target("neon"))) uint32x4_t vqshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  23679   uint32x4_t __ret;
  23680   __ret = (uint32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  23681   return __ret;
  23682 }
  23683 #else
  23684 __ai __attribute__((target("neon"))) uint32x4_t vqshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  23685   uint32x4_t __ret;
  23686   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23687   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23688   __ret = (uint32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  23689   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23690   return __ret;
  23691 }
  23692 #endif
  23693 
  23694 #ifdef __LITTLE_ENDIAN__
  23695 __ai __attribute__((target("neon"))) uint64x2_t vqshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  23696   uint64x2_t __ret;
  23697   __ret = (uint64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  23698   return __ret;
  23699 }
  23700 #else
  23701 __ai __attribute__((target("neon"))) uint64x2_t vqshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  23702   uint64x2_t __ret;
  23703   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23704   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23705   __ret = (uint64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  23706   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23707   return __ret;
  23708 }
  23709 #endif
  23710 
  23711 #ifdef __LITTLE_ENDIAN__
  23712 __ai __attribute__((target("neon"))) uint16x8_t vqshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  23713   uint16x8_t __ret;
  23714   __ret = (uint16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  23715   return __ret;
  23716 }
  23717 #else
  23718 __ai __attribute__((target("neon"))) uint16x8_t vqshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  23719   uint16x8_t __ret;
  23720   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23721   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23722   __ret = (uint16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  23723   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23724   return __ret;
  23725 }
  23726 #endif
  23727 
  23728 #ifdef __LITTLE_ENDIAN__
  23729 __ai __attribute__((target("neon"))) int8x16_t vqshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  23730   int8x16_t __ret;
  23731   __ret = (int8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  23732   return __ret;
  23733 }
  23734 #else
  23735 __ai __attribute__((target("neon"))) int8x16_t vqshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  23736   int8x16_t __ret;
  23737   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23738   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23739   __ret = (int8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  23740   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  23741   return __ret;
  23742 }
  23743 #endif
  23744 
  23745 #ifdef __LITTLE_ENDIAN__
  23746 __ai __attribute__((target("neon"))) int32x4_t vqshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  23747   int32x4_t __ret;
  23748   __ret = (int32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  23749   return __ret;
  23750 }
  23751 #else
  23752 __ai __attribute__((target("neon"))) int32x4_t vqshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  23753   int32x4_t __ret;
  23754   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23755   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23756   __ret = (int32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  23757   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23758   return __ret;
  23759 }
  23760 #endif
  23761 
  23762 #ifdef __LITTLE_ENDIAN__
  23763 __ai __attribute__((target("neon"))) int64x2_t vqshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  23764   int64x2_t __ret;
  23765   __ret = (int64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  23766   return __ret;
  23767 }
  23768 #else
  23769 __ai __attribute__((target("neon"))) int64x2_t vqshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  23770   int64x2_t __ret;
  23771   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23772   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23773   __ret = (int64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  23774   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23775   return __ret;
  23776 }
  23777 #endif
  23778 
  23779 #ifdef __LITTLE_ENDIAN__
  23780 __ai __attribute__((target("neon"))) int16x8_t vqshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  23781   int16x8_t __ret;
  23782   __ret = (int16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  23783   return __ret;
  23784 }
  23785 #else
  23786 __ai __attribute__((target("neon"))) int16x8_t vqshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  23787   int16x8_t __ret;
  23788   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23789   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23790   __ret = (int16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  23791   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23792   return __ret;
  23793 }
  23794 #endif
  23795 
  23796 #ifdef __LITTLE_ENDIAN__
  23797 __ai __attribute__((target("neon"))) uint8x8_t vqshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  23798   uint8x8_t __ret;
  23799   __ret = (uint8x8_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  23800   return __ret;
  23801 }
  23802 #else
  23803 __ai __attribute__((target("neon"))) uint8x8_t vqshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  23804   uint8x8_t __ret;
  23805   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23806   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23807   __ret = (uint8x8_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  23808   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23809   return __ret;
  23810 }
  23811 #endif
  23812 
  23813 #ifdef __LITTLE_ENDIAN__
  23814 __ai __attribute__((target("neon"))) uint32x2_t vqshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  23815   uint32x2_t __ret;
  23816   __ret = (uint32x2_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  23817   return __ret;
  23818 }
  23819 #else
  23820 __ai __attribute__((target("neon"))) uint32x2_t vqshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  23821   uint32x2_t __ret;
  23822   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23823   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23824   __ret = (uint32x2_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  23825   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23826   return __ret;
  23827 }
  23828 #endif
  23829 
  23830 __ai __attribute__((target("neon"))) uint64x1_t vqshl_u64(uint64x1_t __p0, int64x1_t __p1) {
  23831   uint64x1_t __ret;
  23832   __ret = (uint64x1_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  23833   return __ret;
  23834 }
  23835 #ifdef __LITTLE_ENDIAN__
  23836 __ai __attribute__((target("neon"))) uint16x4_t vqshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  23837   uint16x4_t __ret;
  23838   __ret = (uint16x4_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  23839   return __ret;
  23840 }
  23841 #else
  23842 __ai __attribute__((target("neon"))) uint16x4_t vqshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  23843   uint16x4_t __ret;
  23844   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23845   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23846   __ret = (uint16x4_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  23847   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23848   return __ret;
  23849 }
  23850 #endif
  23851 
  23852 #ifdef __LITTLE_ENDIAN__
  23853 __ai __attribute__((target("neon"))) int8x8_t vqshl_s8(int8x8_t __p0, int8x8_t __p1) {
  23854   int8x8_t __ret;
  23855   __ret = (int8x8_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  23856   return __ret;
  23857 }
  23858 #else
  23859 __ai __attribute__((target("neon"))) int8x8_t vqshl_s8(int8x8_t __p0, int8x8_t __p1) {
  23860   int8x8_t __ret;
  23861   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  23862   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  23863   __ret = (int8x8_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  23864   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  23865   return __ret;
  23866 }
  23867 #endif
  23868 
  23869 #ifdef __LITTLE_ENDIAN__
  23870 __ai __attribute__((target("neon"))) int32x2_t vqshl_s32(int32x2_t __p0, int32x2_t __p1) {
  23871   int32x2_t __ret;
  23872   __ret = (int32x2_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  23873   return __ret;
  23874 }
  23875 #else
  23876 __ai __attribute__((target("neon"))) int32x2_t vqshl_s32(int32x2_t __p0, int32x2_t __p1) {
  23877   int32x2_t __ret;
  23878   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  23879   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  23880   __ret = (int32x2_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  23881   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  23882   return __ret;
  23883 }
  23884 #endif
  23885 
  23886 __ai __attribute__((target("neon"))) int64x1_t vqshl_s64(int64x1_t __p0, int64x1_t __p1) {
  23887   int64x1_t __ret;
  23888   __ret = (int64x1_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  23889   return __ret;
  23890 }
  23891 #ifdef __LITTLE_ENDIAN__
  23892 __ai __attribute__((target("neon"))) int16x4_t vqshl_s16(int16x4_t __p0, int16x4_t __p1) {
  23893   int16x4_t __ret;
  23894   __ret = (int16x4_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  23895   return __ret;
  23896 }
  23897 #else
  23898 __ai __attribute__((target("neon"))) int16x4_t vqshl_s16(int16x4_t __p0, int16x4_t __p1) {
  23899   int16x4_t __ret;
  23900   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  23901   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  23902   __ret = (int16x4_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  23903   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  23904   return __ret;
  23905 }
  23906 #endif
  23907 
  23908 #ifdef __LITTLE_ENDIAN__
  23909 #define vqshlq_n_u8(__p0, __p1) __extension__ ({ \
  23910   uint8x16_t __ret; \
  23911   uint8x16_t __s0 = __p0; \
  23912   __ret = (uint8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 48); \
  23913   __ret; \
  23914 })
  23915 #else
  23916 #define vqshlq_n_u8(__p0, __p1) __extension__ ({ \
  23917   uint8x16_t __ret; \
  23918   uint8x16_t __s0 = __p0; \
  23919   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  23920   __ret = (uint8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 48); \
  23921   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  23922   __ret; \
  23923 })
  23924 #endif
  23925 
  23926 #ifdef __LITTLE_ENDIAN__
  23927 #define vqshlq_n_u32(__p0, __p1) __extension__ ({ \
  23928   uint32x4_t __ret; \
  23929   uint32x4_t __s0 = __p0; \
  23930   __ret = (uint32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 50); \
  23931   __ret; \
  23932 })
  23933 #else
  23934 #define vqshlq_n_u32(__p0, __p1) __extension__ ({ \
  23935   uint32x4_t __ret; \
  23936   uint32x4_t __s0 = __p0; \
  23937   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  23938   __ret = (uint32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 50); \
  23939   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  23940   __ret; \
  23941 })
  23942 #endif
  23943 
  23944 #ifdef __LITTLE_ENDIAN__
  23945 #define vqshlq_n_u64(__p0, __p1) __extension__ ({ \
  23946   uint64x2_t __ret; \
  23947   uint64x2_t __s0 = __p0; \
  23948   __ret = (uint64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 51); \
  23949   __ret; \
  23950 })
  23951 #else
  23952 #define vqshlq_n_u64(__p0, __p1) __extension__ ({ \
  23953   uint64x2_t __ret; \
  23954   uint64x2_t __s0 = __p0; \
  23955   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  23956   __ret = (uint64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 51); \
  23957   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  23958   __ret; \
  23959 })
  23960 #endif
  23961 
  23962 #ifdef __LITTLE_ENDIAN__
  23963 #define vqshlq_n_u16(__p0, __p1) __extension__ ({ \
  23964   uint16x8_t __ret; \
  23965   uint16x8_t __s0 = __p0; \
  23966   __ret = (uint16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 49); \
  23967   __ret; \
  23968 })
  23969 #else
  23970 #define vqshlq_n_u16(__p0, __p1) __extension__ ({ \
  23971   uint16x8_t __ret; \
  23972   uint16x8_t __s0 = __p0; \
  23973   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  23974   __ret = (uint16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 49); \
  23975   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  23976   __ret; \
  23977 })
  23978 #endif
  23979 
  23980 #ifdef __LITTLE_ENDIAN__
  23981 #define vqshlq_n_s8(__p0, __p1) __extension__ ({ \
  23982   int8x16_t __ret; \
  23983   int8x16_t __s0 = __p0; \
  23984   __ret = (int8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 32); \
  23985   __ret; \
  23986 })
  23987 #else
  23988 #define vqshlq_n_s8(__p0, __p1) __extension__ ({ \
  23989   int8x16_t __ret; \
  23990   int8x16_t __s0 = __p0; \
  23991   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  23992   __ret = (int8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 32); \
  23993   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  23994   __ret; \
  23995 })
  23996 #endif
  23997 
  23998 #ifdef __LITTLE_ENDIAN__
  23999 #define vqshlq_n_s32(__p0, __p1) __extension__ ({ \
  24000   int32x4_t __ret; \
  24001   int32x4_t __s0 = __p0; \
  24002   __ret = (int32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 34); \
  24003   __ret; \
  24004 })
  24005 #else
  24006 #define vqshlq_n_s32(__p0, __p1) __extension__ ({ \
  24007   int32x4_t __ret; \
  24008   int32x4_t __s0 = __p0; \
  24009   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24010   __ret = (int32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 34); \
  24011   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24012   __ret; \
  24013 })
  24014 #endif
  24015 
  24016 #ifdef __LITTLE_ENDIAN__
  24017 #define vqshlq_n_s64(__p0, __p1) __extension__ ({ \
  24018   int64x2_t __ret; \
  24019   int64x2_t __s0 = __p0; \
  24020   __ret = (int64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 35); \
  24021   __ret; \
  24022 })
  24023 #else
  24024 #define vqshlq_n_s64(__p0, __p1) __extension__ ({ \
  24025   int64x2_t __ret; \
  24026   int64x2_t __s0 = __p0; \
  24027   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24028   __ret = (int64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 35); \
  24029   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24030   __ret; \
  24031 })
  24032 #endif
  24033 
  24034 #ifdef __LITTLE_ENDIAN__
  24035 #define vqshlq_n_s16(__p0, __p1) __extension__ ({ \
  24036   int16x8_t __ret; \
  24037   int16x8_t __s0 = __p0; \
  24038   __ret = (int16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 33); \
  24039   __ret; \
  24040 })
  24041 #else
  24042 #define vqshlq_n_s16(__p0, __p1) __extension__ ({ \
  24043   int16x8_t __ret; \
  24044   int16x8_t __s0 = __p0; \
  24045   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24046   __ret = (int16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 33); \
  24047   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24048   __ret; \
  24049 })
  24050 #endif
  24051 
  24052 #ifdef __LITTLE_ENDIAN__
  24053 #define vqshl_n_u8(__p0, __p1) __extension__ ({ \
  24054   uint8x8_t __ret; \
  24055   uint8x8_t __s0 = __p0; \
  24056   __ret = (uint8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 16); \
  24057   __ret; \
  24058 })
  24059 #else
  24060 #define vqshl_n_u8(__p0, __p1) __extension__ ({ \
  24061   uint8x8_t __ret; \
  24062   uint8x8_t __s0 = __p0; \
  24063   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24064   __ret = (uint8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 16); \
  24065   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24066   __ret; \
  24067 })
  24068 #endif
  24069 
  24070 #ifdef __LITTLE_ENDIAN__
  24071 #define vqshl_n_u32(__p0, __p1) __extension__ ({ \
  24072   uint32x2_t __ret; \
  24073   uint32x2_t __s0 = __p0; \
  24074   __ret = (uint32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 18); \
  24075   __ret; \
  24076 })
  24077 #else
  24078 #define vqshl_n_u32(__p0, __p1) __extension__ ({ \
  24079   uint32x2_t __ret; \
  24080   uint32x2_t __s0 = __p0; \
  24081   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24082   __ret = (uint32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 18); \
  24083   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24084   __ret; \
  24085 })
  24086 #endif
  24087 
  24088 #define vqshl_n_u64(__p0, __p1) __extension__ ({ \
  24089   uint64x1_t __ret; \
  24090   uint64x1_t __s0 = __p0; \
  24091   __ret = (uint64x1_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 19); \
  24092   __ret; \
  24093 })
  24094 #ifdef __LITTLE_ENDIAN__
  24095 #define vqshl_n_u16(__p0, __p1) __extension__ ({ \
  24096   uint16x4_t __ret; \
  24097   uint16x4_t __s0 = __p0; \
  24098   __ret = (uint16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 17); \
  24099   __ret; \
  24100 })
  24101 #else
  24102 #define vqshl_n_u16(__p0, __p1) __extension__ ({ \
  24103   uint16x4_t __ret; \
  24104   uint16x4_t __s0 = __p0; \
  24105   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24106   __ret = (uint16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 17); \
  24107   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24108   __ret; \
  24109 })
  24110 #endif
  24111 
  24112 #ifdef __LITTLE_ENDIAN__
  24113 #define vqshl_n_s8(__p0, __p1) __extension__ ({ \
  24114   int8x8_t __ret; \
  24115   int8x8_t __s0 = __p0; \
  24116   __ret = (int8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 0); \
  24117   __ret; \
  24118 })
  24119 #else
  24120 #define vqshl_n_s8(__p0, __p1) __extension__ ({ \
  24121   int8x8_t __ret; \
  24122   int8x8_t __s0 = __p0; \
  24123   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24124   __ret = (int8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 0); \
  24125   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24126   __ret; \
  24127 })
  24128 #endif
  24129 
  24130 #ifdef __LITTLE_ENDIAN__
  24131 #define vqshl_n_s32(__p0, __p1) __extension__ ({ \
  24132   int32x2_t __ret; \
  24133   int32x2_t __s0 = __p0; \
  24134   __ret = (int32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 2); \
  24135   __ret; \
  24136 })
  24137 #else
  24138 #define vqshl_n_s32(__p0, __p1) __extension__ ({ \
  24139   int32x2_t __ret; \
  24140   int32x2_t __s0 = __p0; \
  24141   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24142   __ret = (int32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 2); \
  24143   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24144   __ret; \
  24145 })
  24146 #endif
  24147 
  24148 #define vqshl_n_s64(__p0, __p1) __extension__ ({ \
  24149   int64x1_t __ret; \
  24150   int64x1_t __s0 = __p0; \
  24151   __ret = (int64x1_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 3); \
  24152   __ret; \
  24153 })
  24154 #ifdef __LITTLE_ENDIAN__
  24155 #define vqshl_n_s16(__p0, __p1) __extension__ ({ \
  24156   int16x4_t __ret; \
  24157   int16x4_t __s0 = __p0; \
  24158   __ret = (int16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 1); \
  24159   __ret; \
  24160 })
  24161 #else
  24162 #define vqshl_n_s16(__p0, __p1) __extension__ ({ \
  24163   int16x4_t __ret; \
  24164   int16x4_t __s0 = __p0; \
  24165   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24166   __ret = (int16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 1); \
  24167   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24168   __ret; \
  24169 })
  24170 #endif
  24171 
  24172 #ifdef __LITTLE_ENDIAN__
  24173 #define vqshluq_n_s8(__p0, __p1) __extension__ ({ \
  24174   uint8x16_t __ret; \
  24175   int8x16_t __s0 = __p0; \
  24176   __ret = (uint8x16_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 48); \
  24177   __ret; \
  24178 })
  24179 #else
  24180 #define vqshluq_n_s8(__p0, __p1) __extension__ ({ \
  24181   uint8x16_t __ret; \
  24182   int8x16_t __s0 = __p0; \
  24183   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  24184   __ret = (uint8x16_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 48); \
  24185   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  24186   __ret; \
  24187 })
  24188 #endif
  24189 
  24190 #ifdef __LITTLE_ENDIAN__
  24191 #define vqshluq_n_s32(__p0, __p1) __extension__ ({ \
  24192   uint32x4_t __ret; \
  24193   int32x4_t __s0 = __p0; \
  24194   __ret = (uint32x4_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 50); \
  24195   __ret; \
  24196 })
  24197 #else
  24198 #define vqshluq_n_s32(__p0, __p1) __extension__ ({ \
  24199   uint32x4_t __ret; \
  24200   int32x4_t __s0 = __p0; \
  24201   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24202   __ret = (uint32x4_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 50); \
  24203   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24204   __ret; \
  24205 })
  24206 #endif
  24207 
  24208 #ifdef __LITTLE_ENDIAN__
  24209 #define vqshluq_n_s64(__p0, __p1) __extension__ ({ \
  24210   uint64x2_t __ret; \
  24211   int64x2_t __s0 = __p0; \
  24212   __ret = (uint64x2_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 51); \
  24213   __ret; \
  24214 })
  24215 #else
  24216 #define vqshluq_n_s64(__p0, __p1) __extension__ ({ \
  24217   uint64x2_t __ret; \
  24218   int64x2_t __s0 = __p0; \
  24219   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24220   __ret = (uint64x2_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 51); \
  24221   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24222   __ret; \
  24223 })
  24224 #endif
  24225 
  24226 #ifdef __LITTLE_ENDIAN__
  24227 #define vqshluq_n_s16(__p0, __p1) __extension__ ({ \
  24228   uint16x8_t __ret; \
  24229   int16x8_t __s0 = __p0; \
  24230   __ret = (uint16x8_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 49); \
  24231   __ret; \
  24232 })
  24233 #else
  24234 #define vqshluq_n_s16(__p0, __p1) __extension__ ({ \
  24235   uint16x8_t __ret; \
  24236   int16x8_t __s0 = __p0; \
  24237   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24238   __ret = (uint16x8_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 49); \
  24239   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24240   __ret; \
  24241 })
  24242 #endif
  24243 
  24244 #ifdef __LITTLE_ENDIAN__
  24245 #define vqshlu_n_s8(__p0, __p1) __extension__ ({ \
  24246   uint8x8_t __ret; \
  24247   int8x8_t __s0 = __p0; \
  24248   __ret = (uint8x8_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 16); \
  24249   __ret; \
  24250 })
  24251 #else
  24252 #define vqshlu_n_s8(__p0, __p1) __extension__ ({ \
  24253   uint8x8_t __ret; \
  24254   int8x8_t __s0 = __p0; \
  24255   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24256   __ret = (uint8x8_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 16); \
  24257   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24258   __ret; \
  24259 })
  24260 #endif
  24261 
  24262 #ifdef __LITTLE_ENDIAN__
  24263 #define vqshlu_n_s32(__p0, __p1) __extension__ ({ \
  24264   uint32x2_t __ret; \
  24265   int32x2_t __s0 = __p0; \
  24266   __ret = (uint32x2_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 18); \
  24267   __ret; \
  24268 })
  24269 #else
  24270 #define vqshlu_n_s32(__p0, __p1) __extension__ ({ \
  24271   uint32x2_t __ret; \
  24272   int32x2_t __s0 = __p0; \
  24273   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24274   __ret = (uint32x2_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 18); \
  24275   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24276   __ret; \
  24277 })
  24278 #endif
  24279 
  24280 #define vqshlu_n_s64(__p0, __p1) __extension__ ({ \
  24281   uint64x1_t __ret; \
  24282   int64x1_t __s0 = __p0; \
  24283   __ret = (uint64x1_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 19); \
  24284   __ret; \
  24285 })
  24286 #ifdef __LITTLE_ENDIAN__
  24287 #define vqshlu_n_s16(__p0, __p1) __extension__ ({ \
  24288   uint16x4_t __ret; \
  24289   int16x4_t __s0 = __p0; \
  24290   __ret = (uint16x4_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 17); \
  24291   __ret; \
  24292 })
  24293 #else
  24294 #define vqshlu_n_s16(__p0, __p1) __extension__ ({ \
  24295   uint16x4_t __ret; \
  24296   int16x4_t __s0 = __p0; \
  24297   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24298   __ret = (uint16x4_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 17); \
  24299   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24300   __ret; \
  24301 })
  24302 #endif
  24303 
  24304 #ifdef __LITTLE_ENDIAN__
  24305 #define vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  24306   uint16x4_t __ret; \
  24307   uint32x4_t __s0 = __p0; \
  24308   __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 17); \
  24309   __ret; \
  24310 })
  24311 #else
  24312 #define vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  24313   uint16x4_t __ret; \
  24314   uint32x4_t __s0 = __p0; \
  24315   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24316   __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 17); \
  24317   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24318   __ret; \
  24319 })
  24320 #define __noswap_vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  24321   uint16x4_t __ret; \
  24322   uint32x4_t __s0 = __p0; \
  24323   __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 17); \
  24324   __ret; \
  24325 })
  24326 #endif
  24327 
  24328 #ifdef __LITTLE_ENDIAN__
  24329 #define vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  24330   uint32x2_t __ret; \
  24331   uint64x2_t __s0 = __p0; \
  24332   __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 18); \
  24333   __ret; \
  24334 })
  24335 #else
  24336 #define vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  24337   uint32x2_t __ret; \
  24338   uint64x2_t __s0 = __p0; \
  24339   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24340   __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 18); \
  24341   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24342   __ret; \
  24343 })
  24344 #define __noswap_vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  24345   uint32x2_t __ret; \
  24346   uint64x2_t __s0 = __p0; \
  24347   __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 18); \
  24348   __ret; \
  24349 })
  24350 #endif
  24351 
  24352 #ifdef __LITTLE_ENDIAN__
  24353 #define vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  24354   uint8x8_t __ret; \
  24355   uint16x8_t __s0 = __p0; \
  24356   __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 16); \
  24357   __ret; \
  24358 })
  24359 #else
  24360 #define vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  24361   uint8x8_t __ret; \
  24362   uint16x8_t __s0 = __p0; \
  24363   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24364   __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 16); \
  24365   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24366   __ret; \
  24367 })
  24368 #define __noswap_vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  24369   uint8x8_t __ret; \
  24370   uint16x8_t __s0 = __p0; \
  24371   __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 16); \
  24372   __ret; \
  24373 })
  24374 #endif
  24375 
  24376 #ifdef __LITTLE_ENDIAN__
  24377 #define vqshrn_n_s32(__p0, __p1) __extension__ ({ \
  24378   int16x4_t __ret; \
  24379   int32x4_t __s0 = __p0; \
  24380   __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 1); \
  24381   __ret; \
  24382 })
  24383 #else
  24384 #define vqshrn_n_s32(__p0, __p1) __extension__ ({ \
  24385   int16x4_t __ret; \
  24386   int32x4_t __s0 = __p0; \
  24387   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24388   __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 1); \
  24389   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24390   __ret; \
  24391 })
  24392 #define __noswap_vqshrn_n_s32(__p0, __p1) __extension__ ({ \
  24393   int16x4_t __ret; \
  24394   int32x4_t __s0 = __p0; \
  24395   __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 1); \
  24396   __ret; \
  24397 })
  24398 #endif
  24399 
  24400 #ifdef __LITTLE_ENDIAN__
  24401 #define vqshrn_n_s64(__p0, __p1) __extension__ ({ \
  24402   int32x2_t __ret; \
  24403   int64x2_t __s0 = __p0; \
  24404   __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 2); \
  24405   __ret; \
  24406 })
  24407 #else
  24408 #define vqshrn_n_s64(__p0, __p1) __extension__ ({ \
  24409   int32x2_t __ret; \
  24410   int64x2_t __s0 = __p0; \
  24411   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24412   __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 2); \
  24413   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24414   __ret; \
  24415 })
  24416 #define __noswap_vqshrn_n_s64(__p0, __p1) __extension__ ({ \
  24417   int32x2_t __ret; \
  24418   int64x2_t __s0 = __p0; \
  24419   __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 2); \
  24420   __ret; \
  24421 })
  24422 #endif
  24423 
  /* vqshrn_n_s16(__p0, __p1): stores __p0 in an int16x8_t local, hands it and
   * __p1 to __builtin_neon_vqshrn_n_v, and evaluates to an int8x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight input lanes are reversed
   * before the builtin and the eight result lanes are reversed after it;
   * __noswap_vqshrn_n_s16 (defined only in that branch) skips both reversals.
   * NOTE(review): the trailing constant 0 is presumably a type code for the
   * builtin -- confirm against the compiler's builtin definitions. */
  24424 #ifdef __LITTLE_ENDIAN__
  24425 #define vqshrn_n_s16(__p0, __p1) __extension__ ({ \
  24426   int8x8_t __ret; \
  24427   int16x8_t __s0 = __p0; \
  24428   __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 0); \
  24429   __ret; \
  24430 })
  24431 #else /* !__LITTLE_ENDIAN__ */
  24432 #define vqshrn_n_s16(__p0, __p1) __extension__ ({ \
  24433   int8x8_t __ret; \
  24434   int16x8_t __s0 = __p0; \
  24435   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24436   __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 0); \
  24437   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24438   __ret; \
  24439 })
  24440 #define __noswap_vqshrn_n_s16(__p0, __p1) __extension__ ({ \
  24441   int8x8_t __ret; \
  24442   int16x8_t __s0 = __p0; \
  24443   __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 0); \
  24444   __ret; \
  24445 })
  24446 #endif /* __LITTLE_ENDIAN__ */
  24447 
  /* vqshrun_n_s32(__p0, __p1): stores __p0 in an int32x4_t local, hands it and
   * __p1 to __builtin_neon_vqshrun_n_v, and evaluates to a uint16x4_t (signed
   * input type, unsigned result type).
   * When __LITTLE_ENDIAN__ is not defined, the input lanes are reversed before
   * the builtin and the result lanes are reversed after it;
   * __noswap_vqshrun_n_s32 (defined only in that branch) skips both reversals.
   * NOTE(review): the trailing constant 17 is presumably a type code for the
   * builtin -- confirm against the compiler's builtin definitions. */
  24448 #ifdef __LITTLE_ENDIAN__
  24449 #define vqshrun_n_s32(__p0, __p1) __extension__ ({ \
  24450   uint16x4_t __ret; \
  24451   int32x4_t __s0 = __p0; \
  24452   __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 17); \
  24453   __ret; \
  24454 })
  24455 #else /* !__LITTLE_ENDIAN__ */
  24456 #define vqshrun_n_s32(__p0, __p1) __extension__ ({ \
  24457   uint16x4_t __ret; \
  24458   int32x4_t __s0 = __p0; \
  24459   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  24460   __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 17); \
  24461   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  24462   __ret; \
  24463 })
  24464 #define __noswap_vqshrun_n_s32(__p0, __p1) __extension__ ({ \
  24465   uint16x4_t __ret; \
  24466   int32x4_t __s0 = __p0; \
  24467   __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 17); \
  24468   __ret; \
  24469 })
  24470 #endif /* __LITTLE_ENDIAN__ */
  24471 
  /* vqshrun_n_s64(__p0, __p1): stores __p0 in an int64x2_t local, hands it and
   * __p1 to __builtin_neon_vqshrun_n_v, and evaluates to a uint32x2_t (signed
   * input type, unsigned result type).
   * When __LITTLE_ENDIAN__ is not defined, the two input lanes are swapped
   * before the builtin and the two result lanes are swapped after it;
   * __noswap_vqshrun_n_s64 (defined only in that branch) skips both swaps.
   * NOTE(review): the trailing constant 18 is presumably a type code for the
   * builtin -- confirm against the compiler's builtin definitions. */
  24472 #ifdef __LITTLE_ENDIAN__
  24473 #define vqshrun_n_s64(__p0, __p1) __extension__ ({ \
  24474   uint32x2_t __ret; \
  24475   int64x2_t __s0 = __p0; \
  24476   __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 18); \
  24477   __ret; \
  24478 })
  24479 #else /* !__LITTLE_ENDIAN__ */
  24480 #define vqshrun_n_s64(__p0, __p1) __extension__ ({ \
  24481   uint32x2_t __ret; \
  24482   int64x2_t __s0 = __p0; \
  24483   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  24484   __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 18); \
  24485   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  24486   __ret; \
  24487 })
  24488 #define __noswap_vqshrun_n_s64(__p0, __p1) __extension__ ({ \
  24489   uint32x2_t __ret; \
  24490   int64x2_t __s0 = __p0; \
  24491   __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 18); \
  24492   __ret; \
  24493 })
  24494 #endif /* __LITTLE_ENDIAN__ */
  24495 
  /* vqshrun_n_s16(__p0, __p1): stores __p0 in an int16x8_t local, hands it and
   * __p1 to __builtin_neon_vqshrun_n_v, and evaluates to a uint8x8_t (signed
   * input type, unsigned result type).
   * When __LITTLE_ENDIAN__ is not defined, the eight input lanes are reversed
   * before the builtin and the eight result lanes are reversed after it;
   * __noswap_vqshrun_n_s16 (defined only in that branch) skips both reversals.
   * NOTE(review): the trailing constant 16 is presumably a type code for the
   * builtin -- confirm against the compiler's builtin definitions. */
  24496 #ifdef __LITTLE_ENDIAN__
  24497 #define vqshrun_n_s16(__p0, __p1) __extension__ ({ \
  24498   uint8x8_t __ret; \
  24499   int16x8_t __s0 = __p0; \
  24500   __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 16); \
  24501   __ret; \
  24502 })
  24503 #else /* !__LITTLE_ENDIAN__ */
  24504 #define vqshrun_n_s16(__p0, __p1) __extension__ ({ \
  24505   uint8x8_t __ret; \
  24506   int16x8_t __s0 = __p0; \
  24507   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  24508   __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 16); \
  24509   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  24510   __ret; \
  24511 })
  24512 #define __noswap_vqshrun_n_s16(__p0, __p1) __extension__ ({ \
  24513   uint8x8_t __ret; \
  24514   int16x8_t __s0 = __p0; \
  24515   __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 16); \
  24516   __ret; \
  24517 })
  24518 #endif /* __LITTLE_ENDIAN__ */
  24519 
  /* vqsubq_u8: passes both uint8x16_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 48) and returns the result as uint8x16_t.
   * When __LITTLE_ENDIAN__ is not defined, the 16 lanes of each operand are
   * reversed before the call and the 16 lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24520 #ifdef __LITTLE_ENDIAN__
  24521 __ai __attribute__((target("neon"))) uint8x16_t vqsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  24522   uint8x16_t __ret;
  24523   __ret = (uint8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  24524   return __ret;
  24525 }
  24526 #else /* !__LITTLE_ENDIAN__ */
  24527 __ai __attribute__((target("neon"))) uint8x16_t vqsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  24528   uint8x16_t __ret;
  24529   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24530   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24531   __ret = (uint8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  24532   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24533   return __ret;
  24534 }
  24535 #endif /* __LITTLE_ENDIAN__ */
  24536 
  /* vqsubq_u32: passes both uint32x4_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 50) and returns the result as uint32x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24537 #ifdef __LITTLE_ENDIAN__
  24538 __ai __attribute__((target("neon"))) uint32x4_t vqsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  24539   uint32x4_t __ret;
  24540   __ret = (uint32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  24541   return __ret;
  24542 }
  24543 #else /* !__LITTLE_ENDIAN__ */
  24544 __ai __attribute__((target("neon"))) uint32x4_t vqsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  24545   uint32x4_t __ret;
  24546   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24547   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24548   __ret = (uint32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  24549   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24550   return __ret;
  24551 }
  24552 #endif /* __LITTLE_ENDIAN__ */
  24553 
  /* vqsubq_u64: passes both uint64x2_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 51) and returns the result as uint64x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24554 #ifdef __LITTLE_ENDIAN__
  24555 __ai __attribute__((target("neon"))) uint64x2_t vqsubq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  24556   uint64x2_t __ret;
  24557   __ret = (uint64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  24558   return __ret;
  24559 }
  24560 #else /* !__LITTLE_ENDIAN__ */
  24561 __ai __attribute__((target("neon"))) uint64x2_t vqsubq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  24562   uint64x2_t __ret;
  24563   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24564   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24565   __ret = (uint64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  24566   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24567   return __ret;
  24568 }
  24569 #endif /* __LITTLE_ENDIAN__ */
  24570 
  /* vqsubq_u16: passes both uint16x8_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 49) and returns the result as uint16x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24571 #ifdef __LITTLE_ENDIAN__
  24572 __ai __attribute__((target("neon"))) uint16x8_t vqsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  24573   uint16x8_t __ret;
  24574   __ret = (uint16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  24575   return __ret;
  24576 }
  24577 #else /* !__LITTLE_ENDIAN__ */
  24578 __ai __attribute__((target("neon"))) uint16x8_t vqsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  24579   uint16x8_t __ret;
  24580   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24581   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24582   __ret = (uint16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  24583   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24584   return __ret;
  24585 }
  24586 #endif /* __LITTLE_ENDIAN__ */
  24587 
  /* vqsubq_s8: passes both int8x16_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 32) and returns the result as int8x16_t.
   * When __LITTLE_ENDIAN__ is not defined, the 16 lanes of each operand are
   * reversed before the call and the 16 lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24588 #ifdef __LITTLE_ENDIAN__
  24589 __ai __attribute__((target("neon"))) int8x16_t vqsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  24590   int8x16_t __ret;
  24591   __ret = (int8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  24592   return __ret;
  24593 }
  24594 #else /* !__LITTLE_ENDIAN__ */
  24595 __ai __attribute__((target("neon"))) int8x16_t vqsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  24596   int8x16_t __ret;
  24597   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24598   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24599   __ret = (int8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  24600   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  24601   return __ret;
  24602 }
  24603 #endif /* __LITTLE_ENDIAN__ */
  24604 
  /* vqsubq_s32: passes both int32x4_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 34) and returns the result as int32x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24605 #ifdef __LITTLE_ENDIAN__
  24606 __ai __attribute__((target("neon"))) int32x4_t vqsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  24607   int32x4_t __ret;
  24608   __ret = (int32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  24609   return __ret;
  24610 }
  24611 #else /* !__LITTLE_ENDIAN__ */
  24612 __ai __attribute__((target("neon"))) int32x4_t vqsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  24613   int32x4_t __ret;
  24614   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24615   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24616   __ret = (int32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  24617   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24618   return __ret;
  24619 }
  24620 #endif /* __LITTLE_ENDIAN__ */
  24621 
  /* vqsubq_s64: passes both int64x2_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 35) and returns the result as int64x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24622 #ifdef __LITTLE_ENDIAN__
  24623 __ai __attribute__((target("neon"))) int64x2_t vqsubq_s64(int64x2_t __p0, int64x2_t __p1) {
  24624   int64x2_t __ret;
  24625   __ret = (int64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  24626   return __ret;
  24627 }
  24628 #else /* !__LITTLE_ENDIAN__ */
  24629 __ai __attribute__((target("neon"))) int64x2_t vqsubq_s64(int64x2_t __p0, int64x2_t __p1) {
  24630   int64x2_t __ret;
  24631   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24632   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24633   __ret = (int64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  24634   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24635   return __ret;
  24636 }
  24637 #endif /* __LITTLE_ENDIAN__ */
  24638 
  /* vqsubq_s16: passes both int16x8_t operands to __builtin_neon_vqsubq_v
   * (trailing constant 33) and returns the result as int16x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24639 #ifdef __LITTLE_ENDIAN__
  24640 __ai __attribute__((target("neon"))) int16x8_t vqsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  24641   int16x8_t __ret;
  24642   __ret = (int16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  24643   return __ret;
  24644 }
  24645 #else /* !__LITTLE_ENDIAN__ */
  24646 __ai __attribute__((target("neon"))) int16x8_t vqsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  24647   int16x8_t __ret;
  24648   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24649   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24650   __ret = (int16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  24651   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24652   return __ret;
  24653 }
  24654 #endif /* __LITTLE_ENDIAN__ */
  24655 
  /* vqsub_u8: passes both uint8x8_t operands to __builtin_neon_vqsub_v
   * (trailing constant 16) and returns the result as uint8x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24656 #ifdef __LITTLE_ENDIAN__
  24657 __ai __attribute__((target("neon"))) uint8x8_t vqsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  24658   uint8x8_t __ret;
  24659   __ret = (uint8x8_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  24660   return __ret;
  24661 }
  24662 #else /* !__LITTLE_ENDIAN__ */
  24663 __ai __attribute__((target("neon"))) uint8x8_t vqsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  24664   uint8x8_t __ret;
  24665   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24666   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24667   __ret = (uint8x8_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  24668   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24669   return __ret;
  24670 }
  24671 #endif /* __LITTLE_ENDIAN__ */
  24672 
  /* vqsub_u32: passes both uint32x2_t operands to __builtin_neon_vqsub_v
   * (trailing constant 18) and returns the result as uint32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24673 #ifdef __LITTLE_ENDIAN__
  24674 __ai __attribute__((target("neon"))) uint32x2_t vqsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  24675   uint32x2_t __ret;
  24676   __ret = (uint32x2_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  24677   return __ret;
  24678 }
  24679 #else /* !__LITTLE_ENDIAN__ */
  24680 __ai __attribute__((target("neon"))) uint32x2_t vqsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  24681   uint32x2_t __ret;
  24682   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24683   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24684   __ret = (uint32x2_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  24685   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24686   return __ret;
  24687 }
  24688 #endif /* __LITTLE_ENDIAN__ */
  24689 
  /* vqsub_u64: passes both uint64x1_t operands to __builtin_neon_vqsub_v
   * (trailing constant 19) and returns the result as uint64x1_t.  There is a
   * single definition with no __LITTLE_ENDIAN__ split and no lane shuffle.
   * NOTE(review): presumably because the x1 vector has only one lane, so
   * there is nothing to reorder -- confirm. */
  24690 __ai __attribute__((target("neon"))) uint64x1_t vqsub_u64(uint64x1_t __p0, uint64x1_t __p1) {
  24691   uint64x1_t __ret;
  24692   __ret = (uint64x1_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  24693   return __ret;
  24694 }
  /* vqsub_u16: passes both uint16x4_t operands to __builtin_neon_vqsub_v
   * (trailing constant 17) and returns the result as uint16x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24695 #ifdef __LITTLE_ENDIAN__
  24696 __ai __attribute__((target("neon"))) uint16x4_t vqsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  24697   uint16x4_t __ret;
  24698   __ret = (uint16x4_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  24699   return __ret;
  24700 }
  24701 #else /* !__LITTLE_ENDIAN__ */
  24702 __ai __attribute__((target("neon"))) uint16x4_t vqsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  24703   uint16x4_t __ret;
  24704   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24705   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24706   __ret = (uint16x4_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  24707   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24708   return __ret;
  24709 }
  24710 #endif /* __LITTLE_ENDIAN__ */
  24711 
  /* vqsub_s8: passes both int8x8_t operands to __builtin_neon_vqsub_v
   * (trailing constant 0) and returns the result as int8x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24712 #ifdef __LITTLE_ENDIAN__
  24713 __ai __attribute__((target("neon"))) int8x8_t vqsub_s8(int8x8_t __p0, int8x8_t __p1) {
  24714   int8x8_t __ret;
  24715   __ret = (int8x8_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  24716   return __ret;
  24717 }
  24718 #else /* !__LITTLE_ENDIAN__ */
  24719 __ai __attribute__((target("neon"))) int8x8_t vqsub_s8(int8x8_t __p0, int8x8_t __p1) {
  24720   int8x8_t __ret;
  24721   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24722   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24723   __ret = (int8x8_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  24724   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24725   return __ret;
  24726 }
  24727 #endif /* __LITTLE_ENDIAN__ */
  24728 
  /* vqsub_s32: passes both int32x2_t operands to __builtin_neon_vqsub_v
   * (trailing constant 2) and returns the result as int32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24729 #ifdef __LITTLE_ENDIAN__
  24730 __ai __attribute__((target("neon"))) int32x2_t vqsub_s32(int32x2_t __p0, int32x2_t __p1) {
  24731   int32x2_t __ret;
  24732   __ret = (int32x2_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  24733   return __ret;
  24734 }
  24735 #else /* !__LITTLE_ENDIAN__ */
  24736 __ai __attribute__((target("neon"))) int32x2_t vqsub_s32(int32x2_t __p0, int32x2_t __p1) {
  24737   int32x2_t __ret;
  24738   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24739   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24740   __ret = (int32x2_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  24741   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24742   return __ret;
  24743 }
  24744 #endif /* __LITTLE_ENDIAN__ */
  24745 
  /* vqsub_s64: passes both int64x1_t operands to __builtin_neon_vqsub_v
   * (trailing constant 3) and returns the result as int64x1_t.  There is a
   * single definition with no __LITTLE_ENDIAN__ split and no lane shuffle.
   * NOTE(review): presumably because the x1 vector has only one lane, so
   * there is nothing to reorder -- confirm. */
  24746 __ai __attribute__((target("neon"))) int64x1_t vqsub_s64(int64x1_t __p0, int64x1_t __p1) {
  24747   int64x1_t __ret;
  24748   __ret = (int64x1_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  24749   return __ret;
  24750 }
  /* vqsub_s16: passes both int16x4_t operands to __builtin_neon_vqsub_v
   * (trailing constant 1) and returns the result as int16x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the lane-wise saturating
   * subtract of __p1 from __p0 -- confirm against the ACLE reference. */
  24751 #ifdef __LITTLE_ENDIAN__
  24752 __ai __attribute__((target("neon"))) int16x4_t vqsub_s16(int16x4_t __p0, int16x4_t __p1) {
  24753   int16x4_t __ret;
  24754   __ret = (int16x4_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  24755   return __ret;
  24756 }
  24757 #else /* !__LITTLE_ENDIAN__ */
  24758 __ai __attribute__((target("neon"))) int16x4_t vqsub_s16(int16x4_t __p0, int16x4_t __p1) {
  24759   int16x4_t __ret;
  24760   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24761   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24762   __ret = (int16x4_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  24763   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24764   return __ret;
  24765 }
  24766 #endif /* __LITTLE_ENDIAN__ */
  24767 
  /* vraddhn_u32: passes both uint32x4_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 17) and returns the narrower-element result as
   * uint16x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards;
   * __noswap_vraddhn_u32 (defined only in that branch) skips the reversals.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24768 #ifdef __LITTLE_ENDIAN__
  24769 __ai __attribute__((target("neon"))) uint16x4_t vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  24770   uint16x4_t __ret;
  24771   __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  24772   return __ret;
  24773 }
  24774 #else /* !__LITTLE_ENDIAN__ */
  24775 __ai __attribute__((target("neon"))) uint16x4_t vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  24776   uint16x4_t __ret;
  24777   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24778   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24779   __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17);
  24780   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24781   return __ret;
  24782 }
  24783 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  24784   uint16x4_t __ret;
  24785   __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  24786   return __ret;
  24787 }
  24788 #endif /* __LITTLE_ENDIAN__ */
  24789 
  /* vraddhn_u64: passes both uint64x2_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 18) and returns the narrower-element result as
   * uint32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards;
   * __noswap_vraddhn_u64 (defined only in that branch) skips the swaps.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24790 #ifdef __LITTLE_ENDIAN__
  24791 __ai __attribute__((target("neon"))) uint32x2_t vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  24792   uint32x2_t __ret;
  24793   __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  24794   return __ret;
  24795 }
  24796 #else /* !__LITTLE_ENDIAN__ */
  24797 __ai __attribute__((target("neon"))) uint32x2_t vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  24798   uint32x2_t __ret;
  24799   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24800   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24801   __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18);
  24802   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24803   return __ret;
  24804 }
  24805 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  24806   uint32x2_t __ret;
  24807   __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  24808   return __ret;
  24809 }
  24810 #endif /* __LITTLE_ENDIAN__ */
  24811 
  /* vraddhn_u16: passes both uint16x8_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 16) and returns the narrower-element result as
   * uint8x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards;
   * __noswap_vraddhn_u16 (defined only in that branch) skips the reversals.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24812 #ifdef __LITTLE_ENDIAN__
  24813 __ai __attribute__((target("neon"))) uint8x8_t vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  24814   uint8x8_t __ret;
  24815   __ret = (uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  24816   return __ret;
  24817 }
  24818 #else /* !__LITTLE_ENDIAN__ */
  24819 __ai __attribute__((target("neon"))) uint8x8_t vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  24820   uint8x8_t __ret;
  24821   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24822   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24823   __ret = (uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16);
  24824   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24825   return __ret;
  24826 }
  24827 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  24828   uint8x8_t __ret;
  24829   __ret = (uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  24830   return __ret;
  24831 }
  24832 #endif /* __LITTLE_ENDIAN__ */
  24833 
  /* vraddhn_s32: passes both int32x4_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 1) and returns the narrower-element result as
   * int16x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards;
   * __noswap_vraddhn_s32 (defined only in that branch) skips the reversals.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24834 #ifdef __LITTLE_ENDIAN__
  24835 __ai __attribute__((target("neon"))) int16x4_t vraddhn_s32(int32x4_t __p0, int32x4_t __p1) {
  24836   int16x4_t __ret;
  24837   __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  24838   return __ret;
  24839 }
  24840 #else /* !__LITTLE_ENDIAN__ */
  24841 __ai __attribute__((target("neon"))) int16x4_t vraddhn_s32(int32x4_t __p0, int32x4_t __p1) {
  24842   int16x4_t __ret;
  24843   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24844   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24845   __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1);
  24846   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24847   return __ret;
  24848 }
  24849 __ai __attribute__((target("neon"))) int16x4_t __noswap_vraddhn_s32(int32x4_t __p0, int32x4_t __p1) {
  24850   int16x4_t __ret;
  24851   __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  24852   return __ret;
  24853 }
  24854 #endif /* __LITTLE_ENDIAN__ */
  24855 
  /* vraddhn_s64: passes both int64x2_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 2) and returns the narrower-element result as
   * int32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards;
   * __noswap_vraddhn_s64 (defined only in that branch) skips the swaps.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24856 #ifdef __LITTLE_ENDIAN__
  24857 __ai __attribute__((target("neon"))) int32x2_t vraddhn_s64(int64x2_t __p0, int64x2_t __p1) {
  24858   int32x2_t __ret;
  24859   __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  24860   return __ret;
  24861 }
  24862 #else /* !__LITTLE_ENDIAN__ */
  24863 __ai __attribute__((target("neon"))) int32x2_t vraddhn_s64(int64x2_t __p0, int64x2_t __p1) {
  24864   int32x2_t __ret;
  24865   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24866   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24867   __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2);
  24868   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24869   return __ret;
  24870 }
  24871 __ai __attribute__((target("neon"))) int32x2_t __noswap_vraddhn_s64(int64x2_t __p0, int64x2_t __p1) {
  24872   int32x2_t __ret;
  24873   __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  24874   return __ret;
  24875 }
  24876 #endif /* __LITTLE_ENDIAN__ */
  24877 
  /* vraddhn_s16: passes both int16x8_t operands to __builtin_neon_vraddhn_v
   * (trailing constant 0) and returns the narrower-element result as
   * int8x8_t.
   * When __LITTLE_ENDIAN__ is not defined, the eight lanes of each operand are
   * reversed before the call and the eight lanes of the result afterwards;
   * __noswap_vraddhn_s16 (defined only in that branch) skips the reversals.
   * NOTE(review): by ACLE naming this is presumably a rounding add returning
   * the high half of each sum -- confirm against the ACLE reference. */
  24878 #ifdef __LITTLE_ENDIAN__
  24879 __ai __attribute__((target("neon"))) int8x8_t vraddhn_s16(int16x8_t __p0, int16x8_t __p1) {
  24880   int8x8_t __ret;
  24881   __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  24882   return __ret;
  24883 }
  24884 #else /* !__LITTLE_ENDIAN__ */
  24885 __ai __attribute__((target("neon"))) int8x8_t vraddhn_s16(int16x8_t __p0, int16x8_t __p1) {
  24886   int8x8_t __ret;
  24887   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  24888   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  24889   __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0);
  24890   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  24891   return __ret;
  24892 }
  24893 __ai __attribute__((target("neon"))) int8x8_t __noswap_vraddhn_s16(int16x8_t __p0, int16x8_t __p1) {
  24894   int8x8_t __ret;
  24895   __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  24896   return __ret;
  24897 }
  24898 #endif /* __LITTLE_ENDIAN__ */
  24899 
  /* vrecpeq_u32: passes the uint32x4_t operand to __builtin_neon_vrecpeq_v
   * (trailing constant 50) and returns the result as uint32x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of the operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably a per-lane reciprocal
   * estimate -- confirm against the ACLE reference. */
  24900 #ifdef __LITTLE_ENDIAN__
  24901 __ai __attribute__((target("neon"))) uint32x4_t vrecpeq_u32(uint32x4_t __p0) {
  24902   uint32x4_t __ret;
  24903   __ret = (uint32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 50);
  24904   return __ret;
  24905 }
  24906 #else /* !__LITTLE_ENDIAN__ */
  24907 __ai __attribute__((target("neon"))) uint32x4_t vrecpeq_u32(uint32x4_t __p0) {
  24908   uint32x4_t __ret;
  24909   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24910   __ret = (uint32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 50);
  24911   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24912   return __ret;
  24913 }
  24914 #endif /* __LITTLE_ENDIAN__ */
  24915 
  /* vrecpeq_f32: passes the float32x4_t operand to __builtin_neon_vrecpeq_v
   * (trailing constant 41) and returns the result as float32x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of the operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably a per-lane reciprocal
   * estimate -- confirm against the ACLE reference. */
  24916 #ifdef __LITTLE_ENDIAN__
  24917 __ai __attribute__((target("neon"))) float32x4_t vrecpeq_f32(float32x4_t __p0) {
  24918   float32x4_t __ret;
  24919   __ret = (float32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 41);
  24920   return __ret;
  24921 }
  24922 #else /* !__LITTLE_ENDIAN__ */
  24923 __ai __attribute__((target("neon"))) float32x4_t vrecpeq_f32(float32x4_t __p0) {
  24924   float32x4_t __ret;
  24925   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24926   __ret = (float32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 41);
  24927   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24928   return __ret;
  24929 }
  24930 #endif /* __LITTLE_ENDIAN__ */
  24931 
  /* vrecpe_u32: passes the uint32x2_t operand to __builtin_neon_vrecpe_v
   * (trailing constant 18) and returns the result as uint32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of the operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably a per-lane reciprocal
   * estimate -- confirm against the ACLE reference. */
  24932 #ifdef __LITTLE_ENDIAN__
  24933 __ai __attribute__((target("neon"))) uint32x2_t vrecpe_u32(uint32x2_t __p0) {
  24934   uint32x2_t __ret;
  24935   __ret = (uint32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 18);
  24936   return __ret;
  24937 }
  24938 #else /* !__LITTLE_ENDIAN__ */
  24939 __ai __attribute__((target("neon"))) uint32x2_t vrecpe_u32(uint32x2_t __p0) {
  24940   uint32x2_t __ret;
  24941   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24942   __ret = (uint32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__rev0, 18);
  24943   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24944   return __ret;
  24945 }
  24946 #endif /* __LITTLE_ENDIAN__ */
  24947 
  /* vrecpe_f32: passes the float32x2_t operand to __builtin_neon_vrecpe_v
   * (trailing constant 9) and returns the result as float32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of the operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably a per-lane reciprocal
   * estimate -- confirm against the ACLE reference. */
  24948 #ifdef __LITTLE_ENDIAN__
  24949 __ai __attribute__((target("neon"))) float32x2_t vrecpe_f32(float32x2_t __p0) {
  24950   float32x2_t __ret;
  24951   __ret = (float32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 9);
  24952   return __ret;
  24953 }
  24954 #else /* !__LITTLE_ENDIAN__ */
  24955 __ai __attribute__((target("neon"))) float32x2_t vrecpe_f32(float32x2_t __p0) {
  24956   float32x2_t __ret;
  24957   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24958   __ret = (float32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__rev0, 9);
  24959   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24960   return __ret;
  24961 }
  24962 #endif /* __LITTLE_ENDIAN__ */
  24963 
  /* vrecpsq_f32: passes both float32x4_t operands to __builtin_neon_vrecpsq_v
   * (trailing constant 41) and returns the result as float32x4_t.
   * When __LITTLE_ENDIAN__ is not defined, the four lanes of each operand are
   * reversed before the call and the four lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the reciprocal "step"
   * operation paired with the reciprocal estimate -- confirm against the
   * ACLE reference. */
  24964 #ifdef __LITTLE_ENDIAN__
  24965 __ai __attribute__((target("neon"))) float32x4_t vrecpsq_f32(float32x4_t __p0, float32x4_t __p1) {
  24966   float32x4_t __ret;
  24967   __ret = (float32x4_t) __builtin_neon_vrecpsq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  24968   return __ret;
  24969 }
  24970 #else /* !__LITTLE_ENDIAN__ */
  24971 __ai __attribute__((target("neon"))) float32x4_t vrecpsq_f32(float32x4_t __p0, float32x4_t __p1) {
  24972   float32x4_t __ret;
  24973   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  24974   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  24975   __ret = (float32x4_t) __builtin_neon_vrecpsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  24976   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  24977   return __ret;
  24978 }
  24979 #endif /* __LITTLE_ENDIAN__ */
  24980 
  /* vrecps_f32: passes both float32x2_t operands to __builtin_neon_vrecps_v
   * (trailing constant 9) and returns the result as float32x2_t.
   * When __LITTLE_ENDIAN__ is not defined, the two lanes of each operand are
   * swapped before the call and the two lanes of the result afterwards.
   * NOTE(review): by ACLE naming this is presumably the reciprocal "step"
   * operation paired with the reciprocal estimate -- confirm against the
   * ACLE reference. */
  24981 #ifdef __LITTLE_ENDIAN__
  24982 __ai __attribute__((target("neon"))) float32x2_t vrecps_f32(float32x2_t __p0, float32x2_t __p1) {
  24983   float32x2_t __ret;
  24984   __ret = (float32x2_t) __builtin_neon_vrecps_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  24985   return __ret;
  24986 }
  24987 #else /* !__LITTLE_ENDIAN__ */
  24988 __ai __attribute__((target("neon"))) float32x2_t vrecps_f32(float32x2_t __p0, float32x2_t __p1) {
  24989   float32x2_t __ret;
  24990   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  24991   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  24992   __ret = (float32x2_t) __builtin_neon_vrecps_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  24993   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  24994   return __ret;
  24995 }
  24996 #endif /* __LITTLE_ENDIAN__ */
  24997 
  /* vrev16_p8: returns a poly8x8_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,5,4,7,6).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  24998 #ifdef __LITTLE_ENDIAN__
  24999 __ai __attribute__((target("neon"))) poly8x8_t vrev16_p8(poly8x8_t __p0) {
  25000   poly8x8_t __ret;
  25001   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25002   return __ret;
  25003 }
  25004 #else /* !__LITTLE_ENDIAN__ */
  25005 __ai __attribute__((target("neon"))) poly8x8_t vrev16_p8(poly8x8_t __p0) {
  25006   poly8x8_t __ret;
  25007   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25008   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25009   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25010   return __ret;
  25011 }
  25012 #endif /* __LITTLE_ENDIAN__ */
  25013 
  /* vrev16q_p8: returns a poly8x16_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,...,15,14).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  25014 #ifdef __LITTLE_ENDIAN__
  25015 __ai __attribute__((target("neon"))) poly8x16_t vrev16q_p8(poly8x16_t __p0) {
  25016   poly8x16_t __ret;
  25017   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25018   return __ret;
  25019 }
  25020 #else /* !__LITTLE_ENDIAN__ */
  25021 __ai __attribute__((target("neon"))) poly8x16_t vrev16q_p8(poly8x16_t __p0) {
  25022   poly8x16_t __ret;
  25023   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25024   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25025   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25026   return __ret;
  25027 }
  25028 #endif /* __LITTLE_ENDIAN__ */
  25029 
  /* vrev16q_u8: returns a uint8x16_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,...,15,14).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  25030 #ifdef __LITTLE_ENDIAN__
  25031 __ai __attribute__((target("neon"))) uint8x16_t vrev16q_u8(uint8x16_t __p0) {
  25032   uint8x16_t __ret;
  25033   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25034   return __ret;
  25035 }
  25036 #else /* !__LITTLE_ENDIAN__ */
  25037 __ai __attribute__((target("neon"))) uint8x16_t vrev16q_u8(uint8x16_t __p0) {
  25038   uint8x16_t __ret;
  25039   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25040   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25041   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25042   return __ret;
  25043 }
  25044 #endif /* __LITTLE_ENDIAN__ */
  25045 
  /* vrev16q_s8: returns an int8x16_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,...,15,14).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  25046 #ifdef __LITTLE_ENDIAN__
  25047 __ai __attribute__((target("neon"))) int8x16_t vrev16q_s8(int8x16_t __p0) {
  25048   int8x16_t __ret;
  25049   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25050   return __ret;
  25051 }
  25052 #else /* !__LITTLE_ENDIAN__ */
  25053 __ai __attribute__((target("neon"))) int8x16_t vrev16q_s8(int8x16_t __p0) {
  25054   int8x16_t __ret;
  25055   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25056   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14);
  25057   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25058   return __ret;
  25059 }
  25060 #endif /* __LITTLE_ENDIAN__ */
  25061 
  /* vrev16_u8: returns a uint8x8_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,5,4,7,6).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  25062 #ifdef __LITTLE_ENDIAN__
  25063 __ai __attribute__((target("neon"))) uint8x8_t vrev16_u8(uint8x8_t __p0) {
  25064   uint8x8_t __ret;
  25065   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25066   return __ret;
  25067 }
  25068 #else /* !__LITTLE_ENDIAN__ */
  25069 __ai __attribute__((target("neon"))) uint8x8_t vrev16_u8(uint8x8_t __p0) {
  25070   uint8x8_t __ret;
  25071   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25072   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25073   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25074   return __ret;
  25075 }
  25076 #endif /* __LITTLE_ENDIAN__ */
  25077 
  /* vrev16_s8: returns an int8x8_t in which each adjacent pair of lanes of
   * __p0 is exchanged (shuffle indices 1,0,3,2,5,4,7,6).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same pair swap is applied, and the result is lane-reversed
   * again before it is returned. */
  25078 #ifdef __LITTLE_ENDIAN__
  25079 __ai __attribute__((target("neon"))) int8x8_t vrev16_s8(int8x8_t __p0) {
  25080   int8x8_t __ret;
  25081   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25082   return __ret;
  25083 }
  25084 #else /* !__LITTLE_ENDIAN__ */
  25085 __ai __attribute__((target("neon"))) int8x8_t vrev16_s8(int8x8_t __p0) {
  25086   int8x8_t __ret;
  25087   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25088   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25089   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25090   return __ret;
  25091 }
  25092 #endif /* __LITTLE_ENDIAN__ */
  25093 
  /* vrev32_p8: returns a poly8x8_t in which the lanes of __p0 are reversed
   * within each group of four (shuffle indices 3,2,1,0,7,6,5,4).
   * When __LITTLE_ENDIAN__ is not defined, the whole vector is lane-reversed
   * first, the same group-of-four reversal is applied, and the result is
   * lane-reversed again before it is returned. */
  25094 #ifdef __LITTLE_ENDIAN__
  25095 __ai __attribute__((target("neon"))) poly8x8_t vrev32_p8(poly8x8_t __p0) {
  25096   poly8x8_t __ret;
  25097   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25098   return __ret;
  25099 }
  25100 #else /* !__LITTLE_ENDIAN__ */
  25101 __ai __attribute__((target("neon"))) poly8x8_t vrev32_p8(poly8x8_t __p0) {
  25102   poly8x8_t __ret;
  25103   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25104   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25105   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25106   return __ret;
  25107 }
  25108 #endif /* __LITTLE_ENDIAN__ */
  25109 
  25110 #ifdef __LITTLE_ENDIAN__
  25111 __ai __attribute__((target("neon"))) poly16x4_t vrev32_p16(poly16x4_t __p0) {
  25112   poly16x4_t __ret;
  25113   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25114   return __ret;
  25115 }
  25116 #else
  25117 __ai __attribute__((target("neon"))) poly16x4_t vrev32_p16(poly16x4_t __p0) {
  25118   poly16x4_t __ret;
  25119   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25120   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25121   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25122   return __ret;
  25123 }
  25124 #endif
  25125 
  25126 #ifdef __LITTLE_ENDIAN__
  25127 __ai __attribute__((target("neon"))) poly8x16_t vrev32q_p8(poly8x16_t __p0) {
  25128   poly8x16_t __ret;
  25129   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25130   return __ret;
  25131 }
  25132 #else
  25133 __ai __attribute__((target("neon"))) poly8x16_t vrev32q_p8(poly8x16_t __p0) {
  25134   poly8x16_t __ret;
  25135   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25136   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25137   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25138   return __ret;
  25139 }
  25140 #endif
  25141 
  25142 #ifdef __LITTLE_ENDIAN__
  25143 __ai __attribute__((target("neon"))) poly16x8_t vrev32q_p16(poly16x8_t __p0) {
  25144   poly16x8_t __ret;
  25145   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25146   return __ret;
  25147 }
  25148 #else
  25149 __ai __attribute__((target("neon"))) poly16x8_t vrev32q_p16(poly16x8_t __p0) {
  25150   poly16x8_t __ret;
  25151   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25152   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25153   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25154   return __ret;
  25155 }
  25156 #endif
  25157 
  25158 #ifdef __LITTLE_ENDIAN__
  25159 __ai __attribute__((target("neon"))) uint8x16_t vrev32q_u8(uint8x16_t __p0) {
  25160   uint8x16_t __ret;
  25161   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25162   return __ret;
  25163 }
  25164 #else
  25165 __ai __attribute__((target("neon"))) uint8x16_t vrev32q_u8(uint8x16_t __p0) {
  25166   uint8x16_t __ret;
  25167   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25168   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25169   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25170   return __ret;
  25171 }
  25172 #endif
  25173 
  25174 #ifdef __LITTLE_ENDIAN__
  25175 __ai __attribute__((target("neon"))) uint16x8_t vrev32q_u16(uint16x8_t __p0) {
  25176   uint16x8_t __ret;
  25177   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25178   return __ret;
  25179 }
  25180 #else
  25181 __ai __attribute__((target("neon"))) uint16x8_t vrev32q_u16(uint16x8_t __p0) {
  25182   uint16x8_t __ret;
  25183   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25184   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25185   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25186   return __ret;
  25187 }
  25188 #endif
  25189 
  25190 #ifdef __LITTLE_ENDIAN__
  25191 __ai __attribute__((target("neon"))) int8x16_t vrev32q_s8(int8x16_t __p0) {
  25192   int8x16_t __ret;
  25193   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25194   return __ret;
  25195 }
  25196 #else
  25197 __ai __attribute__((target("neon"))) int8x16_t vrev32q_s8(int8x16_t __p0) {
  25198   int8x16_t __ret;
  25199   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25200   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12);
  25201   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25202   return __ret;
  25203 }
  25204 #endif
  25205 
  25206 #ifdef __LITTLE_ENDIAN__
  25207 __ai __attribute__((target("neon"))) int16x8_t vrev32q_s16(int16x8_t __p0) {
  25208   int16x8_t __ret;
  25209   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6);
  25210   return __ret;
  25211 }
  25212 #else
  25213 __ai __attribute__((target("neon"))) int16x8_t vrev32q_s16(int16x8_t __p0) {
  25214   int16x8_t __ret;
  25215   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25216   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6);
  25217   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25218   return __ret;
  25219 }
  25220 #endif
  25221 
  25222 #ifdef __LITTLE_ENDIAN__
  25223 __ai __attribute__((target("neon"))) uint8x8_t vrev32_u8(uint8x8_t __p0) {
  25224   uint8x8_t __ret;
  25225   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25226   return __ret;
  25227 }
  25228 #else
  25229 __ai __attribute__((target("neon"))) uint8x8_t vrev32_u8(uint8x8_t __p0) {
  25230   uint8x8_t __ret;
  25231   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25232   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25233   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25234   return __ret;
  25235 }
  25236 #endif
  25237 
  25238 #ifdef __LITTLE_ENDIAN__
  25239 __ai __attribute__((target("neon"))) uint16x4_t vrev32_u16(uint16x4_t __p0) {
  25240   uint16x4_t __ret;
  25241   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25242   return __ret;
  25243 }
  25244 #else
  25245 __ai __attribute__((target("neon"))) uint16x4_t vrev32_u16(uint16x4_t __p0) {
  25246   uint16x4_t __ret;
  25247   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25248   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25249   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25250   return __ret;
  25251 }
  25252 #endif
  25253 
  25254 #ifdef __LITTLE_ENDIAN__
  25255 __ai __attribute__((target("neon"))) int8x8_t vrev32_s8(int8x8_t __p0) {
  25256   int8x8_t __ret;
  25257   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25258   return __ret;
  25259 }
  25260 #else
  25261 __ai __attribute__((target("neon"))) int8x8_t vrev32_s8(int8x8_t __p0) {
  25262   int8x8_t __ret;
  25263   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25264   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25265   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25266   return __ret;
  25267 }
  25268 #endif
  25269 
  25270 #ifdef __LITTLE_ENDIAN__
  25271 __ai __attribute__((target("neon"))) int16x4_t vrev32_s16(int16x4_t __p0) {
  25272   int16x4_t __ret;
  25273   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25274   return __ret;
  25275 }
  25276 #else
  25277 __ai __attribute__((target("neon"))) int16x4_t vrev32_s16(int16x4_t __p0) {
  25278   int16x4_t __ret;
  25279   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25280   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25281   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25282   return __ret;
  25283 }
  25284 #endif
  25285 
  25286 #ifdef __LITTLE_ENDIAN__
  25287 __ai __attribute__((target("neon"))) poly8x8_t vrev64_p8(poly8x8_t __p0) {
  25288   poly8x8_t __ret;
  25289   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25290   return __ret;
  25291 }
  25292 #else
  25293 __ai __attribute__((target("neon"))) poly8x8_t vrev64_p8(poly8x8_t __p0) {
  25294   poly8x8_t __ret;
  25295   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25296   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0);
  25297   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25298   return __ret;
  25299 }
  25300 #endif
  25301 
  25302 #ifdef __LITTLE_ENDIAN__
  25303 __ai __attribute__((target("neon"))) poly16x4_t vrev64_p16(poly16x4_t __p0) {
  25304   poly16x4_t __ret;
  25305   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25306   return __ret;
  25307 }
  25308 #else
  25309 __ai __attribute__((target("neon"))) poly16x4_t vrev64_p16(poly16x4_t __p0) {
  25310   poly16x4_t __ret;
  25311   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25312   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0);
  25313   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25314   return __ret;
  25315 }
  25316 #endif
  25317 
  25318 #ifdef __LITTLE_ENDIAN__
  25319 __ai __attribute__((target("neon"))) poly8x16_t vrev64q_p8(poly8x16_t __p0) {
  25320   poly8x16_t __ret;
  25321   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25322   return __ret;
  25323 }
  25324 #else
  25325 __ai __attribute__((target("neon"))) poly8x16_t vrev64q_p8(poly8x16_t __p0) {
  25326   poly8x16_t __ret;
  25327   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25328   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25329   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25330   return __ret;
  25331 }
  25332 #endif
  25333 
  25334 #ifdef __LITTLE_ENDIAN__
  25335 __ai __attribute__((target("neon"))) poly16x8_t vrev64q_p16(poly16x8_t __p0) {
  25336   poly16x8_t __ret;
  25337   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25338   return __ret;
  25339 }
  25340 #else
  25341 __ai __attribute__((target("neon"))) poly16x8_t vrev64q_p16(poly16x8_t __p0) {
  25342   poly16x8_t __ret;
  25343   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25344   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25345   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25346   return __ret;
  25347 }
  25348 #endif
  25349 
  25350 #ifdef __LITTLE_ENDIAN__
  25351 __ai __attribute__((target("neon"))) uint8x16_t vrev64q_u8(uint8x16_t __p0) {
  25352   uint8x16_t __ret;
  25353   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25354   return __ret;
  25355 }
  25356 #else
  25357 __ai __attribute__((target("neon"))) uint8x16_t vrev64q_u8(uint8x16_t __p0) {
  25358   uint8x16_t __ret;
  25359   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25360   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25361   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25362   return __ret;
  25363 }
  25364 #endif
  25365 
  25366 #ifdef __LITTLE_ENDIAN__
  25367 __ai __attribute__((target("neon"))) uint32x4_t vrev64q_u32(uint32x4_t __p0) {
  25368   uint32x4_t __ret;
  25369   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25370   return __ret;
  25371 }
  25372 #else
  25373 __ai __attribute__((target("neon"))) uint32x4_t vrev64q_u32(uint32x4_t __p0) {
  25374   uint32x4_t __ret;
  25375   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25376   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25377   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25378   return __ret;
  25379 }
  25380 #endif
  25381 
  25382 #ifdef __LITTLE_ENDIAN__
  25383 __ai __attribute__((target("neon"))) uint16x8_t vrev64q_u16(uint16x8_t __p0) {
  25384   uint16x8_t __ret;
  25385   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25386   return __ret;
  25387 }
  25388 #else
  25389 __ai __attribute__((target("neon"))) uint16x8_t vrev64q_u16(uint16x8_t __p0) {
  25390   uint16x8_t __ret;
  25391   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25392   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25393   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25394   return __ret;
  25395 }
  25396 #endif
  25397 
  25398 #ifdef __LITTLE_ENDIAN__
  25399 __ai __attribute__((target("neon"))) int8x16_t vrev64q_s8(int8x16_t __p0) {
  25400   int8x16_t __ret;
  25401   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25402   return __ret;
  25403 }
  25404 #else
  25405 __ai __attribute__((target("neon"))) int8x16_t vrev64q_s8(int8x16_t __p0) {
  25406   int8x16_t __ret;
  25407   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25408   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8);
  25409   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25410   return __ret;
  25411 }
  25412 #endif
  25413 
  25414 #ifdef __LITTLE_ENDIAN__
  25415 __ai __attribute__((target("neon"))) float32x4_t vrev64q_f32(float32x4_t __p0) {
  25416   float32x4_t __ret;
  25417   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25418   return __ret;
  25419 }
  25420 #else
  25421 __ai __attribute__((target("neon"))) float32x4_t vrev64q_f32(float32x4_t __p0) {
  25422   float32x4_t __ret;
  25423   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25424   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25425   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25426   return __ret;
  25427 }
  25428 #endif
  25429 
  25430 #ifdef __LITTLE_ENDIAN__
  25431 __ai __attribute__((target("neon"))) int32x4_t vrev64q_s32(int32x4_t __p0) {
  25432   int32x4_t __ret;
  25433   __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2);
  25434   return __ret;
  25435 }
  25436 #else
  25437 __ai __attribute__((target("neon"))) int32x4_t vrev64q_s32(int32x4_t __p0) {
  25438   int32x4_t __ret;
  25439   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25440   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2);
  25441   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25442   return __ret;
  25443 }
  25444 #endif
  25445 
  25446 #ifdef __LITTLE_ENDIAN__
  25447 __ai __attribute__((target("neon"))) int16x8_t vrev64q_s16(int16x8_t __p0) {
  25448   int16x8_t __ret;
  25449   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25450   return __ret;
  25451 }
  25452 #else
  25453 __ai __attribute__((target("neon"))) int16x8_t vrev64q_s16(int16x8_t __p0) {
  25454   int16x8_t __ret;
  25455   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25456   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25457   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25458   return __ret;
  25459 }
  25460 #endif
  25461 
  25462 #ifdef __LITTLE_ENDIAN__
  25463 __ai __attribute__((target("neon"))) uint8x8_t vrev64_u8(uint8x8_t __p0) {
  25464   uint8x8_t __ret;
  25465   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25466   return __ret;
  25467 }
  25468 #else
  25469 __ai __attribute__((target("neon"))) uint8x8_t vrev64_u8(uint8x8_t __p0) {
  25470   uint8x8_t __ret;
  25471   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25472   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0);
  25473   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25474   return __ret;
  25475 }
  25476 #endif
  25477 
  25478 #ifdef __LITTLE_ENDIAN__
  25479 __ai __attribute__((target("neon"))) uint32x2_t vrev64_u32(uint32x2_t __p0) {
  25480   uint32x2_t __ret;
  25481   __ret = __builtin_shufflevector(__p0, __p0, 1, 0);
  25482   return __ret;
  25483 }
  25484 #else
  25485 __ai __attribute__((target("neon"))) uint32x2_t vrev64_u32(uint32x2_t __p0) {
  25486   uint32x2_t __ret;
  25487   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25488   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0);
  25489   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25490   return __ret;
  25491 }
  25492 #endif
  25493 
  25494 #ifdef __LITTLE_ENDIAN__
  25495 __ai __attribute__((target("neon"))) uint16x4_t vrev64_u16(uint16x4_t __p0) {
  25496   uint16x4_t __ret;
  25497   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25498   return __ret;
  25499 }
  25500 #else
  25501 __ai __attribute__((target("neon"))) uint16x4_t vrev64_u16(uint16x4_t __p0) {
  25502   uint16x4_t __ret;
  25503   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25504   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0);
  25505   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25506   return __ret;
  25507 }
  25508 #endif
  25509 
  25510 #ifdef __LITTLE_ENDIAN__
  25511 __ai __attribute__((target("neon"))) int8x8_t vrev64_s8(int8x8_t __p0) {
  25512   int8x8_t __ret;
  25513   __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25514   return __ret;
  25515 }
  25516 #else
  25517 __ai __attribute__((target("neon"))) int8x8_t vrev64_s8(int8x8_t __p0) {
  25518   int8x8_t __ret;
  25519   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25520   __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0);
  25521   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25522   return __ret;
  25523 }
  25524 #endif
  25525 
  25526 #ifdef __LITTLE_ENDIAN__
  25527 __ai __attribute__((target("neon"))) float32x2_t vrev64_f32(float32x2_t __p0) {
  25528   float32x2_t __ret;
  25529   __ret = __builtin_shufflevector(__p0, __p0, 1, 0);
  25530   return __ret;
  25531 }
  25532 #else
  25533 __ai __attribute__((target("neon"))) float32x2_t vrev64_f32(float32x2_t __p0) {
  25534   float32x2_t __ret;
  25535   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25536   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0);
  25537   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25538   return __ret;
  25539 }
  25540 #endif
  25541 
  25542 #ifdef __LITTLE_ENDIAN__
  25543 __ai __attribute__((target("neon"))) int32x2_t vrev64_s32(int32x2_t __p0) {
  25544   int32x2_t __ret;
  25545   __ret = __builtin_shufflevector(__p0, __p0, 1, 0);
  25546   return __ret;
  25547 }
  25548 #else
  25549 __ai __attribute__((target("neon"))) int32x2_t vrev64_s32(int32x2_t __p0) {
  25550   int32x2_t __ret;
  25551   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25552   __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0);
  25553   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25554   return __ret;
  25555 }
  25556 #endif
  25557 
  25558 #ifdef __LITTLE_ENDIAN__
  25559 __ai __attribute__((target("neon"))) int16x4_t vrev64_s16(int16x4_t __p0) {
  25560   int16x4_t __ret;
  25561   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25562   return __ret;
  25563 }
  25564 #else
  25565 __ai __attribute__((target("neon"))) int16x4_t vrev64_s16(int16x4_t __p0) {
  25566   int16x4_t __ret;
  25567   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25568   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0);
  25569   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25570   return __ret;
  25571 }
  25572 #endif
  25573 
  25574 #ifdef __LITTLE_ENDIAN__
  25575 __ai __attribute__((target("neon"))) float16x8_t vrev64q_f16(float16x8_t __p0) {
  25576   float16x8_t __ret;
  25577   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4);
  25578   return __ret;
  25579 }
  25580 #else
  25581 __ai __attribute__((target("neon"))) float16x8_t vrev64q_f16(float16x8_t __p0) {
  25582   float16x8_t __ret;
  25583   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25584   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4);
  25585   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25586   return __ret;
  25587 }
  25588 #endif
  25589 
  25590 #ifdef __LITTLE_ENDIAN__
  25591 __ai __attribute__((target("neon"))) float16x4_t vrev64_f16(float16x4_t __p0) {
  25592   float16x4_t __ret;
  25593   __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25594   return __ret;
  25595 }
  25596 #else
  25597 __ai __attribute__((target("neon"))) float16x4_t vrev64_f16(float16x4_t __p0) {
  25598   float16x4_t __ret;
  25599   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25600   __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0);
  25601   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25602   return __ret;
  25603 }
  25604 #endif
  25605 
  25606 #ifdef __LITTLE_ENDIAN__
  25607 __ai __attribute__((target("neon"))) uint8x16_t vrhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  25608   uint8x16_t __ret;
  25609   __ret = (uint8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  25610   return __ret;
  25611 }
  25612 #else
  25613 __ai __attribute__((target("neon"))) uint8x16_t vrhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  25614   uint8x16_t __ret;
  25615   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25616   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25617   __ret = (uint8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  25618   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25619   return __ret;
  25620 }
  25621 #endif
  25622 
  25623 #ifdef __LITTLE_ENDIAN__
  25624 __ai __attribute__((target("neon"))) uint32x4_t vrhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  25625   uint32x4_t __ret;
  25626   __ret = (uint32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  25627   return __ret;
  25628 }
  25629 #else
  25630 __ai __attribute__((target("neon"))) uint32x4_t vrhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  25631   uint32x4_t __ret;
  25632   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25633   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25634   __ret = (uint32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  25635   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25636   return __ret;
  25637 }
  25638 #endif
  25639 
  25640 #ifdef __LITTLE_ENDIAN__
  25641 __ai __attribute__((target("neon"))) uint16x8_t vrhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  25642   uint16x8_t __ret;
  25643   __ret = (uint16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  25644   return __ret;
  25645 }
  25646 #else
  25647 __ai __attribute__((target("neon"))) uint16x8_t vrhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  25648   uint16x8_t __ret;
  25649   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25650   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25651   __ret = (uint16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  25652   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25653   return __ret;
  25654 }
  25655 #endif
  25656 
  25657 #ifdef __LITTLE_ENDIAN__
  25658 __ai __attribute__((target("neon"))) int8x16_t vrhaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  25659   int8x16_t __ret;
  25660   __ret = (int8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  25661   return __ret;
  25662 }
  25663 #else
  25664 __ai __attribute__((target("neon"))) int8x16_t vrhaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  25665   int8x16_t __ret;
  25666   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25667   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25668   __ret = (int8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  25669   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25670   return __ret;
  25671 }
  25672 #endif
  25673 
  25674 #ifdef __LITTLE_ENDIAN__
  25675 __ai __attribute__((target("neon"))) int32x4_t vrhaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  25676   int32x4_t __ret;
  25677   __ret = (int32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  25678   return __ret;
  25679 }
  25680 #else
  25681 __ai __attribute__((target("neon"))) int32x4_t vrhaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  25682   int32x4_t __ret;
  25683   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25684   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25685   __ret = (int32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  25686   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25687   return __ret;
  25688 }
  25689 #endif
  25690 
  25691 #ifdef __LITTLE_ENDIAN__
  25692 __ai __attribute__((target("neon"))) int16x8_t vrhaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  25693   int16x8_t __ret;
  25694   __ret = (int16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  25695   return __ret;
  25696 }
  25697 #else
  25698 __ai __attribute__((target("neon"))) int16x8_t vrhaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  25699   int16x8_t __ret;
  25700   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25701   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25702   __ret = (int16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  25703   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25704   return __ret;
  25705 }
  25706 #endif
  25707 
  25708 #ifdef __LITTLE_ENDIAN__
  25709 __ai __attribute__((target("neon"))) uint8x8_t vrhadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  25710   uint8x8_t __ret;
  25711   __ret = (uint8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  25712   return __ret;
  25713 }
  25714 #else
  25715 __ai __attribute__((target("neon"))) uint8x8_t vrhadd_u8(uint8x8_t __p0, uint8x8_t __p1) {
  25716   uint8x8_t __ret;
  25717   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25718   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25719   __ret = (uint8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  25720   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25721   return __ret;
  25722 }
  25723 #endif
  25724 
  25725 #ifdef __LITTLE_ENDIAN__
  25726 __ai __attribute__((target("neon"))) uint32x2_t vrhadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  25727   uint32x2_t __ret;
  25728   __ret = (uint32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  25729   return __ret;
  25730 }
  25731 #else
  25732 __ai __attribute__((target("neon"))) uint32x2_t vrhadd_u32(uint32x2_t __p0, uint32x2_t __p1) {
  25733   uint32x2_t __ret;
  25734   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25735   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  25736   __ret = (uint32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  25737   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25738   return __ret;
  25739 }
  25740 #endif
  25741 
  25742 #ifdef __LITTLE_ENDIAN__
  25743 __ai __attribute__((target("neon"))) uint16x4_t vrhadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  25744   uint16x4_t __ret;
  25745   __ret = (uint16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  25746   return __ret;
  25747 }
  25748 #else
  25749 __ai __attribute__((target("neon"))) uint16x4_t vrhadd_u16(uint16x4_t __p0, uint16x4_t __p1) {
  25750   uint16x4_t __ret;
  25751   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25752   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25753   __ret = (uint16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  25754   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25755   return __ret;
  25756 }
  25757 #endif
  25758 
  25759 #ifdef __LITTLE_ENDIAN__
  25760 __ai __attribute__((target("neon"))) int8x8_t vrhadd_s8(int8x8_t __p0, int8x8_t __p1) {
  25761   int8x8_t __ret;
  25762   __ret = (int8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  25763   return __ret;
  25764 }
  25765 #else
  25766 __ai __attribute__((target("neon"))) int8x8_t vrhadd_s8(int8x8_t __p0, int8x8_t __p1) {
  25767   int8x8_t __ret;
  25768   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25769   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25770   __ret = (int8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  25771   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25772   return __ret;
  25773 }
  25774 #endif
  25775 
  25776 #ifdef __LITTLE_ENDIAN__
  25777 __ai __attribute__((target("neon"))) int32x2_t vrhadd_s32(int32x2_t __p0, int32x2_t __p1) {
  25778   int32x2_t __ret;
  25779   __ret = (int32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  25780   return __ret;
  25781 }
  25782 #else
  25783 __ai __attribute__((target("neon"))) int32x2_t vrhadd_s32(int32x2_t __p0, int32x2_t __p1) {
  25784   int32x2_t __ret;
  25785   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25786   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  25787   __ret = (int32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  25788   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25789   return __ret;
  25790 }
  25791 #endif
  25792 
  /* vrhadd_s16(__p0, __p1): casts both int16x4_t vectors to int8x8_t, passes
   * them to __builtin_neon_vrhadd_v and returns the result as int16x4_t.
   * NOTE(review): the ACLE name suggests a rounding halving add, and the
   * trailing 1 looks like the builtin's element-type code -- confirm; neither
   * is defined in this part of the file. */
  25793 #ifdef __LITTLE_ENDIAN__
  25794 __ai __attribute__((target("neon"))) int16x4_t vrhadd_s16(int16x4_t __p0, int16x4_t __p1) {
  25795   int16x4_t __ret;
  25796   __ret = (int16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  25797   return __ret;
  25798 }
  25799 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 4 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25800 __ai __attribute__((target("neon"))) int16x4_t vrhadd_s16(int16x4_t __p0, int16x4_t __p1) {
  25801   int16x4_t __ret;
  25802   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25803   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25804   __ret = (int16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  25805   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25806   return __ret;
  25807 }
  25808 #endif
  25809 
  /* vrshlq_u8(__p0, __p1): passes the uint8x16_t value __p0 and the int8x16_t
   * vector __p1 (both cast to int8x16_t) to __builtin_neon_vrshlq_v and
   * returns the result as uint8x16_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 48 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25810 #ifdef __LITTLE_ENDIAN__
  25811 __ai __attribute__((target("neon"))) uint8x16_t vrshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  25812   uint8x16_t __ret;
  25813   __ret = (uint8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  25814   return __ret;
  25815 }
  25816 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 16 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25817 __ai __attribute__((target("neon"))) uint8x16_t vrshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  25818   uint8x16_t __ret;
  25819   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25820   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25821   __ret = (uint8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  25822   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25823   return __ret;
  25824 }
  25825 #endif
  25826 
  /* vrshlq_u32(__p0, __p1): passes the uint32x4_t value __p0 and the
   * int32x4_t vector __p1 (both cast to int8x16_t) to __builtin_neon_vrshlq_v
   * and returns the result as uint32x4_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 50 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25827 #ifdef __LITTLE_ENDIAN__
  25828 __ai __attribute__((target("neon"))) uint32x4_t vrshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  25829   uint32x4_t __ret;
  25830   __ret = (uint32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  25831   return __ret;
  25832 }
  25833 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 4 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25834 __ai __attribute__((target("neon"))) uint32x4_t vrshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  25835   uint32x4_t __ret;
  25836   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25837   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25838   __ret = (uint32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  25839   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25840   return __ret;
  25841 }
  25842 #endif
  25843 
  /* vrshlq_u64(__p0, __p1): passes the uint64x2_t value __p0 and the
   * int64x2_t vector __p1 (both cast to int8x16_t) to __builtin_neon_vrshlq_v
   * and returns the result as uint64x2_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 51 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25844 #ifdef __LITTLE_ENDIAN__
  25845 __ai __attribute__((target("neon"))) uint64x2_t vrshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  25846   uint64x2_t __ret;
  25847   __ret = (uint64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  25848   return __ret;
  25849 }
  25850 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of each input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  25851 __ai __attribute__((target("neon"))) uint64x2_t vrshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  25852   uint64x2_t __ret;
  25853   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25854   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  25855   __ret = (uint64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  25856   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25857   return __ret;
  25858 }
  25859 #endif
  25860 
  /* vrshlq_u16(__p0, __p1): passes the uint16x8_t value __p0 and the
   * int16x8_t vector __p1 (both cast to int8x16_t) to __builtin_neon_vrshlq_v
   * and returns the result as uint16x8_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 49 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25861 #ifdef __LITTLE_ENDIAN__
  25862 __ai __attribute__((target("neon"))) uint16x8_t vrshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  25863   uint16x8_t __ret;
  25864   __ret = (uint16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  25865   return __ret;
  25866 }
  25867 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 8 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25868 __ai __attribute__((target("neon"))) uint16x8_t vrshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  25869   uint16x8_t __ret;
  25870   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25871   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25872   __ret = (uint16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  25873   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25874   return __ret;
  25875 }
  25876 #endif
  25877 
  /* vrshlq_s8(__p0, __p1): passes both int8x16_t vectors to
   * __builtin_neon_vrshlq_v and returns the result as int8x16_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 32 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25878 #ifdef __LITTLE_ENDIAN__
  25879 __ai __attribute__((target("neon"))) int8x16_t vrshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  25880   int8x16_t __ret;
  25881   __ret = (int8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  25882   return __ret;
  25883 }
  25884 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 16 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25885 __ai __attribute__((target("neon"))) int8x16_t vrshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  25886   int8x16_t __ret;
  25887   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25888   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25889   __ret = (int8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  25890   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  25891   return __ret;
  25892 }
  25893 #endif
  25894 
  /* vrshlq_s32(__p0, __p1): casts both int32x4_t vectors to int8x16_t, passes
   * them to __builtin_neon_vrshlq_v and returns the result as int32x4_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 34 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25895 #ifdef __LITTLE_ENDIAN__
  25896 __ai __attribute__((target("neon"))) int32x4_t vrshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  25897   int32x4_t __ret;
  25898   __ret = (int32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  25899   return __ret;
  25900 }
  25901 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 4 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25902 __ai __attribute__((target("neon"))) int32x4_t vrshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  25903   int32x4_t __ret;
  25904   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25905   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25906   __ret = (int32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  25907   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25908   return __ret;
  25909 }
  25910 #endif
  25911 
  /* vrshlq_s64(__p0, __p1): casts both int64x2_t vectors to int8x16_t, passes
   * them to __builtin_neon_vrshlq_v and returns the result as int64x2_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 35 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25912 #ifdef __LITTLE_ENDIAN__
  25913 __ai __attribute__((target("neon"))) int64x2_t vrshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  25914   int64x2_t __ret;
  25915   __ret = (int64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  25916   return __ret;
  25917 }
  25918 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of each input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  25919 __ai __attribute__((target("neon"))) int64x2_t vrshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  25920   int64x2_t __ret;
  25921   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25922   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  25923   __ret = (int64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  25924   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25925   return __ret;
  25926 }
  25927 #endif
  25928 
  /* vrshlq_s16(__p0, __p1): casts both int16x8_t vectors to int8x16_t, passes
   * them to __builtin_neon_vrshlq_v and returns the result as int16x8_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 33 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25929 #ifdef __LITTLE_ENDIAN__
  25930 __ai __attribute__((target("neon"))) int16x8_t vrshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  25931   int16x8_t __ret;
  25932   __ret = (int16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  25933   return __ret;
  25934 }
  25935 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 8 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25936 __ai __attribute__((target("neon"))) int16x8_t vrshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  25937   int16x8_t __ret;
  25938   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25939   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25940   __ret = (int16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  25941   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25942   return __ret;
  25943 }
  25944 #endif
  25945 
  /* vrshl_u8(__p0, __p1): passes the uint8x8_t value __p0 and the int8x8_t
   * vector __p1 (both cast to int8x8_t) to __builtin_neon_vrshl_v and returns
   * the result as uint8x8_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 16 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25946 #ifdef __LITTLE_ENDIAN__
  25947 __ai __attribute__((target("neon"))) uint8x8_t vrshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  25948   uint8x8_t __ret;
  25949   __ret = (uint8x8_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  25950   return __ret;
  25951 }
  25952 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 8 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25953 __ai __attribute__((target("neon"))) uint8x8_t vrshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  25954   uint8x8_t __ret;
  25955   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  25956   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  25957   __ret = (uint8x8_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  25958   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  25959   return __ret;
  25960 }
  25961 #endif
  25962 
  /* vrshl_u32(__p0, __p1): passes the uint32x2_t value __p0 and the int32x2_t
   * vector __p1 (both cast to int8x8_t) to __builtin_neon_vrshl_v and returns
   * the result as uint32x2_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 18 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25963 #ifdef __LITTLE_ENDIAN__
  25964 __ai __attribute__((target("neon"))) uint32x2_t vrshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  25965   uint32x2_t __ret;
  25966   __ret = (uint32x2_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  25967   return __ret;
  25968 }
  25969 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of each input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  25970 __ai __attribute__((target("neon"))) uint32x2_t vrshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  25971   uint32x2_t __ret;
  25972   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  25973   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  25974   __ret = (uint32x2_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  25975   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  25976   return __ret;
  25977 }
  25978 #endif
  25979 
  /* vrshl_u64(__p0, __p1): passes the uint64x1_t value __p0 and the int64x1_t
   * vector __p1 (both cast to int8x8_t) to __builtin_neon_vrshl_v and returns
   * the result as uint64x1_t. There is a single definition with no
   * __LITTLE_ENDIAN__ split and no lane shuffle.
   * NOTE(review): presumably no shuffle is needed because the x1 types hold
   * one lane; the ACLE name suggests a rounding shift left, and the trailing
   * 19 looks like the builtin's element-type code -- confirm. */
  25980 __ai __attribute__((target("neon"))) uint64x1_t vrshl_u64(uint64x1_t __p0, int64x1_t __p1) {
  25981   uint64x1_t __ret;
  25982   __ret = (uint64x1_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  25983   return __ret;
  25984 }
  /* vrshl_u16(__p0, __p1): passes the uint16x4_t value __p0 and the int16x4_t
   * vector __p1 (both cast to int8x8_t) to __builtin_neon_vrshl_v and returns
   * the result as uint16x4_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 17 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  25985 #ifdef __LITTLE_ENDIAN__
  25986 __ai __attribute__((target("neon"))) uint16x4_t vrshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  25987   uint16x4_t __ret;
  25988   __ret = (uint16x4_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  25989   return __ret;
  25990 }
  25991 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 4 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  25992 __ai __attribute__((target("neon"))) uint16x4_t vrshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  25993   uint16x4_t __ret;
  25994   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  25995   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  25996   __ret = (uint16x4_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  25997   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  25998   return __ret;
  25999 }
  26000 #endif
  26001 
  /* vrshl_s8(__p0, __p1): passes both int8x8_t vectors to
   * __builtin_neon_vrshl_v and returns the result as int8x8_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 0 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  26002 #ifdef __LITTLE_ENDIAN__
  26003 __ai __attribute__((target("neon"))) int8x8_t vrshl_s8(int8x8_t __p0, int8x8_t __p1) {
  26004   int8x8_t __ret;
  26005   __ret = (int8x8_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  26006   return __ret;
  26007 }
  26008 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 8 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26009 __ai __attribute__((target("neon"))) int8x8_t vrshl_s8(int8x8_t __p0, int8x8_t __p1) {
  26010   int8x8_t __ret;
  26011   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  26012   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  26013   __ret = (int8x8_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  26014   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  26015   return __ret;
  26016 }
  26017 #endif
  26018 
  /* vrshl_s32(__p0, __p1): casts both int32x2_t vectors to int8x8_t, passes
   * them to __builtin_neon_vrshl_v and returns the result as int32x2_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 2 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  26019 #ifdef __LITTLE_ENDIAN__
  26020 __ai __attribute__((target("neon"))) int32x2_t vrshl_s32(int32x2_t __p0, int32x2_t __p1) {
  26021   int32x2_t __ret;
  26022   __ret = (int32x2_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  26023   return __ret;
  26024 }
  26025 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of each input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26026 __ai __attribute__((target("neon"))) int32x2_t vrshl_s32(int32x2_t __p0, int32x2_t __p1) {
  26027   int32x2_t __ret;
  26028   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26029   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  26030   __ret = (int32x2_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  26031   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26032   return __ret;
  26033 }
  26034 #endif
  26035 
  /* vrshl_s64(__p0, __p1): casts both int64x1_t vectors to int8x8_t, passes
   * them to __builtin_neon_vrshl_v and returns the result as int64x1_t. There
   * is a single definition with no __LITTLE_ENDIAN__ split and no lane
   * shuffle.
   * NOTE(review): presumably no shuffle is needed because the x1 types hold
   * one lane; the ACLE name suggests a rounding shift left, and the trailing
   * 3 looks like the builtin's element-type code -- confirm. */
  26036 __ai __attribute__((target("neon"))) int64x1_t vrshl_s64(int64x1_t __p0, int64x1_t __p1) {
  26037   int64x1_t __ret;
  26038   __ret = (int64x1_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  26039   return __ret;
  26040 }
  /* vrshl_s16(__p0, __p1): casts both int16x4_t vectors to int8x8_t, passes
   * them to __builtin_neon_vrshl_v and returns the result as int16x4_t.
   * NOTE(review): the ACLE name suggests a rounding shift left of __p0 by the
   * per-lane signed amounts in __p1, and the trailing 1 looks like the
   * builtin's element-type code -- confirm; neither is defined here. */
  26041 #ifdef __LITTLE_ENDIAN__
  26042 __ai __attribute__((target("neon"))) int16x4_t vrshl_s16(int16x4_t __p0, int16x4_t __p1) {
  26043   int16x4_t __ret;
  26044   __ret = (int16x4_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  26045   return __ret;
  26046 }
  26047 #else
  /* __LITTLE_ENDIAN__ not defined: both inputs have their 4 lanes reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26048 __ai __attribute__((target("neon"))) int16x4_t vrshl_s16(int16x4_t __p0, int16x4_t __p1) {
  26049   int16x4_t __ret;
  26050   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26051   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  26052   __ret = (int16x4_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  26053   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26054   return __ret;
  26055 }
  26056 #endif
  26057 
  /* vrshrq_n_u8(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint8x16_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * uint8x16_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 48 looks like the builtin's element-type code -- confirm. */
  26058 #ifdef __LITTLE_ENDIAN__
  26059 #define vrshrq_n_u8(__p0, __p1) __extension__ ({ \
  26060   uint8x16_t __ret; \
  26061   uint8x16_t __s0 = __p0; \
  26062   __ret = (uint8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 48); \
  26063   __ret; \
  26064 })
  26065 #else
  /* __LITTLE_ENDIAN__ not defined: the 16 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26066 #define vrshrq_n_u8(__p0, __p1) __extension__ ({ \
  26067   uint8x16_t __ret; \
  26068   uint8x16_t __s0 = __p0; \
  26069   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26070   __ret = (uint8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 48); \
  26071   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26072   __ret; \
  26073 })
  26074 #endif
  26075 
  /* vrshrq_n_u32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint32x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * uint32x4_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 50 looks like the builtin's element-type code -- confirm. */
  26076 #ifdef __LITTLE_ENDIAN__
  26077 #define vrshrq_n_u32(__p0, __p1) __extension__ ({ \
  26078   uint32x4_t __ret; \
  26079   uint32x4_t __s0 = __p0; \
  26080   __ret = (uint32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 50); \
  26081   __ret; \
  26082 })
  26083 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26084 #define vrshrq_n_u32(__p0, __p1) __extension__ ({ \
  26085   uint32x4_t __ret; \
  26086   uint32x4_t __s0 = __p0; \
  26087   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26088   __ret = (uint32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 50); \
  26089   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26090   __ret; \
  26091 })
  26092 #endif
  26093 
  /* vrshrq_n_u64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint64x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * uint64x2_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 51 looks like the builtin's element-type code -- confirm. */
  26094 #ifdef __LITTLE_ENDIAN__
  26095 #define vrshrq_n_u64(__p0, __p1) __extension__ ({ \
  26096   uint64x2_t __ret; \
  26097   uint64x2_t __s0 = __p0; \
  26098   __ret = (uint64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 51); \
  26099   __ret; \
  26100 })
  26101 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26102 #define vrshrq_n_u64(__p0, __p1) __extension__ ({ \
  26103   uint64x2_t __ret; \
  26104   uint64x2_t __s0 = __p0; \
  26105   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26106   __ret = (uint64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 51); \
  26107   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26108   __ret; \
  26109 })
  26110 #endif
  26111 
  /* vrshrq_n_u16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint16x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * uint16x8_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 49 looks like the builtin's element-type code -- confirm. */
  26112 #ifdef __LITTLE_ENDIAN__
  26113 #define vrshrq_n_u16(__p0, __p1) __extension__ ({ \
  26114   uint16x8_t __ret; \
  26115   uint16x8_t __s0 = __p0; \
  26116   __ret = (uint16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 49); \
  26117   __ret; \
  26118 })
  26119 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26120 #define vrshrq_n_u16(__p0, __p1) __extension__ ({ \
  26121   uint16x8_t __ret; \
  26122   uint16x8_t __s0 = __p0; \
  26123   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26124   __ret = (uint16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 49); \
  26125   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26126   __ret; \
  26127 })
  26128 #endif
  26129 
  /* vrshrq_n_s8(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int8x16_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * int8x16_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 32 looks like the builtin's element-type code -- confirm. */
  26130 #ifdef __LITTLE_ENDIAN__
  26131 #define vrshrq_n_s8(__p0, __p1) __extension__ ({ \
  26132   int8x16_t __ret; \
  26133   int8x16_t __s0 = __p0; \
  26134   __ret = (int8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 32); \
  26135   __ret; \
  26136 })
  26137 #else
  /* __LITTLE_ENDIAN__ not defined: the 16 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26138 #define vrshrq_n_s8(__p0, __p1) __extension__ ({ \
  26139   int8x16_t __ret; \
  26140   int8x16_t __s0 = __p0; \
  26141   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26142   __ret = (int8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 32); \
  26143   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26144   __ret; \
  26145 })
  26146 #endif
  26147 
  /* vrshrq_n_s32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int32x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * int32x4_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 34 looks like the builtin's element-type code -- confirm. */
  26148 #ifdef __LITTLE_ENDIAN__
  26149 #define vrshrq_n_s32(__p0, __p1) __extension__ ({ \
  26150   int32x4_t __ret; \
  26151   int32x4_t __s0 = __p0; \
  26152   __ret = (int32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 34); \
  26153   __ret; \
  26154 })
  26155 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26156 #define vrshrq_n_s32(__p0, __p1) __extension__ ({ \
  26157   int32x4_t __ret; \
  26158   int32x4_t __s0 = __p0; \
  26159   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26160   __ret = (int32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 34); \
  26161   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26162   __ret; \
  26163 })
  26164 #endif
  26165 
  /* vrshrq_n_s64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int64x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * int64x2_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 35 looks like the builtin's element-type code -- confirm. */
  26166 #ifdef __LITTLE_ENDIAN__
  26167 #define vrshrq_n_s64(__p0, __p1) __extension__ ({ \
  26168   int64x2_t __ret; \
  26169   int64x2_t __s0 = __p0; \
  26170   __ret = (int64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 35); \
  26171   __ret; \
  26172 })
  26173 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26174 #define vrshrq_n_s64(__p0, __p1) __extension__ ({ \
  26175   int64x2_t __ret; \
  26176   int64x2_t __s0 = __p0; \
  26177   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26178   __ret = (int64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 35); \
  26179   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26180   __ret; \
  26181 })
  26182 #endif
  26183 
  /* vrshrq_n_s16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int16x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrq_n_v; the macro's value is the
   * int16x8_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 33 looks like the builtin's element-type code -- confirm. */
  26184 #ifdef __LITTLE_ENDIAN__
  26185 #define vrshrq_n_s16(__p0, __p1) __extension__ ({ \
  26186   int16x8_t __ret; \
  26187   int16x8_t __s0 = __p0; \
  26188   __ret = (int16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 33); \
  26189   __ret; \
  26190 })
  26191 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26192 #define vrshrq_n_s16(__p0, __p1) __extension__ ({ \
  26193   int16x8_t __ret; \
  26194   int16x8_t __s0 = __p0; \
  26195   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26196   __ret = (int16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 33); \
  26197   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26198   __ret; \
  26199 })
  26200 #endif
  26201 
  /* vrshr_n_u8(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint8x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the uint8x8_t
   * __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 16 looks like the builtin's element-type code -- confirm. */
  26202 #ifdef __LITTLE_ENDIAN__
  26203 #define vrshr_n_u8(__p0, __p1) __extension__ ({ \
  26204   uint8x8_t __ret; \
  26205   uint8x8_t __s0 = __p0; \
  26206   __ret = (uint8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 16); \
  26207   __ret; \
  26208 })
  26209 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26210 #define vrshr_n_u8(__p0, __p1) __extension__ ({ \
  26211   uint8x8_t __ret; \
  26212   uint8x8_t __s0 = __p0; \
  26213   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26214   __ret = (uint8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 16); \
  26215   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26216   __ret; \
  26217 })
  26218 #endif
  26219 
  /* vrshr_n_u32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint32x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the
   * uint32x2_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 18 looks like the builtin's element-type code -- confirm. */
  26220 #ifdef __LITTLE_ENDIAN__
  26221 #define vrshr_n_u32(__p0, __p1) __extension__ ({ \
  26222   uint32x2_t __ret; \
  26223   uint32x2_t __s0 = __p0; \
  26224   __ret = (uint32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 18); \
  26225   __ret; \
  26226 })
  26227 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26228 #define vrshr_n_u32(__p0, __p1) __extension__ ({ \
  26229   uint32x2_t __ret; \
  26230   uint32x2_t __s0 = __p0; \
  26231   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26232   __ret = (uint32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 18); \
  26233   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26234   __ret; \
  26235 })
  26236 #endif
  26237 
  /* vrshr_n_u64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint64x1_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the
   * uint64x1_t __ret. There is a single definition with no __LITTLE_ENDIAN__
   * split and no lane shuffle.
   * NOTE(review): presumably no shuffle is needed because uint64x1_t holds
   * one lane; the ACLE name suggests a rounding shift right by immediate, and
   * the trailing 19 looks like the builtin's element-type code -- confirm. */
  26238 #define vrshr_n_u64(__p0, __p1) __extension__ ({ \
  26239   uint64x1_t __ret; \
  26240   uint64x1_t __s0 = __p0; \
  26241   __ret = (uint64x1_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 19); \
  26242   __ret; \
  26243 })
  /* vrshr_n_u16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint16x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the
   * uint16x4_t __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 17 looks like the builtin's element-type code -- confirm. */
  26244 #ifdef __LITTLE_ENDIAN__
  26245 #define vrshr_n_u16(__p0, __p1) __extension__ ({ \
  26246   uint16x4_t __ret; \
  26247   uint16x4_t __s0 = __p0; \
  26248   __ret = (uint16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 17); \
  26249   __ret; \
  26250 })
  26251 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26252 #define vrshr_n_u16(__p0, __p1) __extension__ ({ \
  26253   uint16x4_t __ret; \
  26254   uint16x4_t __s0 = __p0; \
  26255   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26256   __ret = (uint16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 17); \
  26257   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26258   __ret; \
  26259 })
  26260 #endif
  26261 
  /* vrshr_n_s8(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int8x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the int8x8_t
   * __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 0 looks like the builtin's element-type code -- confirm. */
  26262 #ifdef __LITTLE_ENDIAN__
  26263 #define vrshr_n_s8(__p0, __p1) __extension__ ({ \
  26264   int8x8_t __ret; \
  26265   int8x8_t __s0 = __p0; \
  26266   __ret = (int8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 0); \
  26267   __ret; \
  26268 })
  26269 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26270 #define vrshr_n_s8(__p0, __p1) __extension__ ({ \
  26271   int8x8_t __ret; \
  26272   int8x8_t __s0 = __p0; \
  26273   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26274   __ret = (int8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 0); \
  26275   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26276   __ret; \
  26277 })
  26278 #endif
  26279 
  /* vrshr_n_s32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int32x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the int32x2_t
   * __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 2 looks like the builtin's element-type code -- confirm. */
  26280 #ifdef __LITTLE_ENDIAN__
  26281 #define vrshr_n_s32(__p0, __p1) __extension__ ({ \
  26282   int32x2_t __ret; \
  26283   int32x2_t __s0 = __p0; \
  26284   __ret = (int32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 2); \
  26285   __ret; \
  26286 })
  26287 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26288 #define vrshr_n_s32(__p0, __p1) __extension__ ({ \
  26289   int32x2_t __ret; \
  26290   int32x2_t __s0 = __p0; \
  26291   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26292   __ret = (int32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 2); \
  26293   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26294   __ret; \
  26295 })
  26296 #endif
  26297 
  /* vrshr_n_s64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int64x1_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the int64x1_t
   * __ret. There is a single definition with no __LITTLE_ENDIAN__ split and
   * no lane shuffle.
   * NOTE(review): presumably no shuffle is needed because int64x1_t holds one
   * lane; the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 3 looks like the builtin's element-type code -- confirm. */
  26298 #define vrshr_n_s64(__p0, __p1) __extension__ ({ \
  26299   int64x1_t __ret; \
  26300   int64x1_t __s0 = __p0; \
  26301   __ret = (int64x1_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 3); \
  26302   __ret; \
  26303 })
  /* vrshr_n_s16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int16x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshr_n_v; the macro's value is the int16x4_t
   * __ret.
   * NOTE(review): presumably a macro so __p1 stays a compile-time constant;
   * the ACLE name suggests a rounding shift right by immediate, and the
   * trailing 1 looks like the builtin's element-type code -- confirm. */
  26304 #ifdef __LITTLE_ENDIAN__
  26305 #define vrshr_n_s16(__p0, __p1) __extension__ ({ \
  26306   int16x4_t __ret; \
  26307   int16x4_t __s0 = __p0; \
  26308   __ret = (int16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 1); \
  26309   __ret; \
  26310 })
  26311 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26312 #define vrshr_n_s16(__p0, __p1) __extension__ ({ \
  26313   int16x4_t __ret; \
  26314   int16x4_t __s0 = __p0; \
  26315   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26316   __ret = (int16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 1); \
  26317   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26318   __ret; \
  26319 })
  26320 #endif
  26321 
  /* vrshrn_n_u32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint32x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is a uint16x4_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 17 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26322 #ifdef __LITTLE_ENDIAN__
  26323 #define vrshrn_n_u32(__p0, __p1) __extension__ ({ \
  26324   uint16x4_t __ret; \
  26325   uint32x4_t __s0 = __p0; \
  26326   __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 17); \
  26327   __ret; \
  26328 })
  26329 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 input lanes are reversed before the
   * builtin call, and the 4 result lanes are reversed back afterwards. */
  26330 #define vrshrn_n_u32(__p0, __p1) __extension__ ({ \
  26331   uint16x4_t __ret; \
  26332   uint32x4_t __s0 = __p0; \
  26333   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26334   __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 17); \
  26335   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26336   __ret; \
  26337 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26338 #define __noswap_vrshrn_n_u32(__p0, __p1) __extension__ ({ \
  26339   uint16x4_t __ret; \
  26340   uint32x4_t __s0 = __p0; \
  26341   __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 17); \
  26342   __ret; \
  26343 })
  26344 #endif
  26345 
  /* vrshrn_n_u64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint64x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is a uint32x2_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 18 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26346 #ifdef __LITTLE_ENDIAN__
  26347 #define vrshrn_n_u64(__p0, __p1) __extension__ ({ \
  26348   uint32x2_t __ret; \
  26349   uint64x2_t __s0 = __p0; \
  26350   __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 18); \
  26351   __ret; \
  26352 })
  26353 #else
  /* __LITTLE_ENDIAN__ not defined: the two input lanes are swapped before the
   * builtin call, and the two result lanes are swapped back afterwards. */
  26354 #define vrshrn_n_u64(__p0, __p1) __extension__ ({ \
  26355   uint32x2_t __ret; \
  26356   uint64x2_t __s0 = __p0; \
  26357   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26358   __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 18); \
  26359   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26360   __ret; \
  26361 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26362 #define __noswap_vrshrn_n_u64(__p0, __p1) __extension__ ({ \
  26363   uint32x2_t __ret; \
  26364   uint64x2_t __s0 = __p0; \
  26365   __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 18); \
  26366   __ret; \
  26367 })
  26368 #endif
  26369 
  /* vrshrn_n_u16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the uint16x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is a uint8x8_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 16 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26370 #ifdef __LITTLE_ENDIAN__
  26371 #define vrshrn_n_u16(__p0, __p1) __extension__ ({ \
  26372   uint8x8_t __ret; \
  26373   uint16x8_t __s0 = __p0; \
  26374   __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 16); \
  26375   __ret; \
  26376 })
  26377 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 input lanes are reversed before the
   * builtin call, and the 8 result lanes are reversed back afterwards. */
  26378 #define vrshrn_n_u16(__p0, __p1) __extension__ ({ \
  26379   uint8x8_t __ret; \
  26380   uint16x8_t __s0 = __p0; \
  26381   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26382   __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 16); \
  26383   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26384   __ret; \
  26385 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26386 #define __noswap_vrshrn_n_u16(__p0, __p1) __extension__ ({ \
  26387   uint8x8_t __ret; \
  26388   uint16x8_t __s0 = __p0; \
  26389   __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 16); \
  26390   __ret; \
  26391 })
  26392 #endif
  26393 
  /* vrshrn_n_s32(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int32x4_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is an int16x4_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 1 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26394 #ifdef __LITTLE_ENDIAN__
  26395 #define vrshrn_n_s32(__p0, __p1) __extension__ ({ \
  26396   int16x4_t __ret; \
  26397   int32x4_t __s0 = __p0; \
  26398   __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 1); \
  26399   __ret; \
  26400 })
  26401 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 input lanes are reversed before the
   * builtin call, and the 4 result lanes are reversed back afterwards. */
  26402 #define vrshrn_n_s32(__p0, __p1) __extension__ ({ \
  26403   int16x4_t __ret; \
  26404   int32x4_t __s0 = __p0; \
  26405   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26406   __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 1); \
  26407   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26408   __ret; \
  26409 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26410 #define __noswap_vrshrn_n_s32(__p0, __p1) __extension__ ({ \
  26411   int16x4_t __ret; \
  26412   int32x4_t __s0 = __p0; \
  26413   __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 1); \
  26414   __ret; \
  26415 })
  26416 #endif
  26417 
  /* vrshrn_n_s64(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int64x2_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is an int32x2_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 2 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26418 #ifdef __LITTLE_ENDIAN__
  26419 #define vrshrn_n_s64(__p0, __p1) __extension__ ({ \
  26420   int32x2_t __ret; \
  26421   int64x2_t __s0 = __p0; \
  26422   __ret = (int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 2); \
  26423   __ret; \
  26424 })
  26425 #else
  /* __LITTLE_ENDIAN__ not defined: the two input lanes are swapped before the
   * builtin call, and the two result lanes are swapped back afterwards. */
  26426 #define vrshrn_n_s64(__p0, __p1) __extension__ ({ \
  26427   int32x2_t __ret; \
  26428   int64x2_t __s0 = __p0; \
  26429   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26430   __ret = (int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 2); \
  26431   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26432   __ret; \
  26433 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26434 #define __noswap_vrshrn_n_s64(__p0, __p1) __extension__ ({ \
  26435   int32x2_t __ret; \
  26436   int64x2_t __s0 = __p0; \
  26437   __ret = (int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 2); \
  26438   __ret; \
  26439 })
  26440 #endif
  26441 
  /* vrshrn_n_s16(__p0, __p1): statement-expression macro. __p0 is copied once
   * into the int16x8_t local __s0; __p1 is pasted unchanged as the second
   * argument of __builtin_neon_vrshrn_n_v; the macro's value is an int8x8_t
   * (half-width elements compared with the input type).
   * NOTE(review): the ACLE name suggests a rounding shift right by immediate
   * with narrowing, and the trailing 0 looks like the element-type code of
   * the result -- confirm; neither is defined in this part of the file. */
  26442 #ifdef __LITTLE_ENDIAN__
  26443 #define vrshrn_n_s16(__p0, __p1) __extension__ ({ \
  26444   int8x8_t __ret; \
  26445   int16x8_t __s0 = __p0; \
  26446   __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 0); \
  26447   __ret; \
  26448 })
  26449 #else
  /* __LITTLE_ENDIAN__ not defined: the 8 input lanes are reversed before the
   * builtin call, and the 8 result lanes are reversed back afterwards. */
  26450 #define vrshrn_n_s16(__p0, __p1) __extension__ ({ \
  26451   int8x8_t __ret; \
  26452   int16x8_t __s0 = __p0; \
  26453   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26454   __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 0); \
  26455   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26456   __ret; \
  26457 })
  /* __noswap_ variant (this branch only): same builtin call with no lane
   * reversal on input or result.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed; no user is visible in this part of the file. */
  26458 #define __noswap_vrshrn_n_s16(__p0, __p1) __extension__ ({ \
  26459   int8x8_t __ret; \
  26460   int16x8_t __s0 = __p0; \
  26461   __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 0); \
  26462   __ret; \
  26463 })
  26464 #endif
  26465 
  /* vrsqrteq_u32(__p0): casts the uint32x4_t input to int8x16_t, passes it to
   * __builtin_neon_vrsqrteq_v and returns the result as uint32x4_t.
   * NOTE(review): the ACLE name suggests a reciprocal square-root estimate,
   * and the trailing 50 looks like the builtin's element-type code --
   * confirm; neither is defined in this part of the file. */
  26466 #ifdef __LITTLE_ENDIAN__
  26467 __ai __attribute__((target("neon"))) uint32x4_t vrsqrteq_u32(uint32x4_t __p0) {
  26468   uint32x4_t __ret;
  26469   __ret = (uint32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__p0, 50);
  26470   return __ret;
  26471 }
  26472 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26473 __ai __attribute__((target("neon"))) uint32x4_t vrsqrteq_u32(uint32x4_t __p0) {
  26474   uint32x4_t __ret;
  26475   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26476   __ret = (uint32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 50);
  26477   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26478   return __ret;
  26479 }
  26480 #endif
  26481 
  /* vrsqrteq_f32(__p0): casts the float32x4_t input to int8x16_t, passes it
   * to __builtin_neon_vrsqrteq_v and returns the result as float32x4_t.
   * NOTE(review): the ACLE name suggests a reciprocal square-root estimate,
   * and the trailing 41 looks like the builtin's element-type code --
   * confirm; neither is defined in this part of the file. */
  26482 #ifdef __LITTLE_ENDIAN__
  26483 __ai __attribute__((target("neon"))) float32x4_t vrsqrteq_f32(float32x4_t __p0) {
  26484   float32x4_t __ret;
  26485   __ret = (float32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__p0, 41);
  26486   return __ret;
  26487 }
  26488 #else
  /* __LITTLE_ENDIAN__ not defined: the 4 lanes of the input are reversed
   * before the builtin call, and the result is reversed back afterwards. */
  26489 __ai __attribute__((target("neon"))) float32x4_t vrsqrteq_f32(float32x4_t __p0) {
  26490   float32x4_t __ret;
  26491   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26492   __ret = (float32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 41);
  26493   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26494   return __ret;
  26495 }
  26496 #endif
  26497 
  /* vrsqrte_u32(__p0): casts the uint32x2_t input to int8x8_t, passes it to
   * __builtin_neon_vrsqrte_v and returns the result as uint32x2_t.
   * NOTE(review): the ACLE name suggests a reciprocal square-root estimate,
   * and the trailing 18 looks like the builtin's element-type code --
   * confirm; neither is defined in this part of the file. */
  26498 #ifdef __LITTLE_ENDIAN__
  26499 __ai __attribute__((target("neon"))) uint32x2_t vrsqrte_u32(uint32x2_t __p0) {
  26500   uint32x2_t __ret;
  26501   __ret = (uint32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 18);
  26502   return __ret;
  26503 }
  26504 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26505 __ai __attribute__((target("neon"))) uint32x2_t vrsqrte_u32(uint32x2_t __p0) {
  26506   uint32x2_t __ret;
  26507   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26508   __ret = (uint32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__rev0, 18);
  26509   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26510   return __ret;
  26511 }
  26512 #endif
  26513 
  /* vrsqrte_f32(__p0): casts the float32x2_t input to int8x8_t, passes it to
   * __builtin_neon_vrsqrte_v and returns the result as float32x2_t.
   * NOTE(review): the ACLE name suggests a reciprocal square-root estimate,
   * and the trailing 9 looks like the builtin's element-type code -- confirm;
   * neither is defined in this part of the file. */
  26514 #ifdef __LITTLE_ENDIAN__
  26515 __ai __attribute__((target("neon"))) float32x2_t vrsqrte_f32(float32x2_t __p0) {
  26516   float32x2_t __ret;
  26517   __ret = (float32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 9);
  26518   return __ret;
  26519 }
  26520 #else
  /* __LITTLE_ENDIAN__ not defined: the two lanes of the input are swapped
   * before the builtin call, and the result lanes are swapped back. */
  26521 __ai __attribute__((target("neon"))) float32x2_t vrsqrte_f32(float32x2_t __p0) {
  26522   float32x2_t __ret;
  26523   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26524   __ret = (float32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__rev0, 9);
  26525   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26526   return __ret;
  26527 }
  26528 #endif
  26529 
  26530 #ifdef __LITTLE_ENDIAN__
  /* vrsqrtsq_f32 (little-endian build): passes __p0 and __p1, each
   * reinterpreted as int8x16_t, to __builtin_neon_vrsqrtsq_v with final
   * argument 41 and returns the result cast to float32x4_t.
   * NOTE(review): the name suggests the ACLE reciprocal square-root step;
   * the arithmetic lives in the builtin and is not visible here. */
  26531 __ai __attribute__((target("neon"))) float32x4_t vrsqrtsq_f32(float32x4_t __p0, float32x4_t __p1) {
  26532   float32x4_t __ret;
  26533   __ret = (float32x4_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  26534   return __ret;
  26535 }
  26536 #else
  /* vrsqrtsq_f32 (big-endian build): same builtin call, but both operands
   * are lane-reversed (3, 2, 1, 0) before the call and the result is
   * lane-reversed again before returning. */
  26537 __ai __attribute__((target("neon"))) float32x4_t vrsqrtsq_f32(float32x4_t __p0, float32x4_t __p1) {
  26538   float32x4_t __ret;
  26539   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26540   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  26541   __ret = (float32x4_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  26542   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26543   return __ret;
  26544 }
  26545 #endif
  26546 
  26547 #ifdef __LITTLE_ENDIAN__
  /* vrsqrts_f32 (little-endian build): passes __p0 and __p1, each
   * reinterpreted as int8x8_t, to __builtin_neon_vrsqrts_v with final
   * argument 9 and returns the result cast to float32x2_t. */
  26548 __ai __attribute__((target("neon"))) float32x2_t vrsqrts_f32(float32x2_t __p0, float32x2_t __p1) {
  26549   float32x2_t __ret;
  26550   __ret = (float32x2_t) __builtin_neon_vrsqrts_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  26551   return __ret;
  26552 }
  26553 #else
  /* vrsqrts_f32 (big-endian build): same builtin call, but both operands
   * have their two lanes swapped (1, 0) before the call and the result is
   * swapped back before returning. */
  26554 __ai __attribute__((target("neon"))) float32x2_t vrsqrts_f32(float32x2_t __p0, float32x2_t __p1) {
  26555   float32x2_t __ret;
  26556   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26557   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  26558   __ret = (float32x2_t) __builtin_neon_vrsqrts_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  26559   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26560   return __ret;
  26561 }
  26562 #endif
  26563 
  26564 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_u8 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into uint8x16_t temporaries, then the macro
   * yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 48) cast to
   * uint8x16_t. __p2 is pasted textually into the builtin call.
   * NOTE(review): presumably __p2 must be a constant shift amount - confirm
   * against the ACLE specification. */
  26565 #define vrsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  26566   uint8x16_t __ret; \
  26567   uint8x16_t __s0 = __p0; \
  26568   uint8x16_t __s1 = __p1; \
  26569   __ret = (uint8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  26570   __ret; \
  26571 })
  26572 #else
  /* vrsraq_n_u8 (big-endian build): as above, except both vector operands
   * are lane-reversed (15 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26573 #define vrsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  26574   uint8x16_t __ret; \
  26575   uint8x16_t __s0 = __p0; \
  26576   uint8x16_t __s1 = __p1; \
  26577   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26578   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26579   __ret = (uint8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  26580   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26581   __ret; \
  26582 })
  26583 #endif
  26584 
  26585 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_u32 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into uint32x4_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 50) cast to
   * uint32x4_t. __p2 is pasted textually into the builtin call. */
  26586 #define vrsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  26587   uint32x4_t __ret; \
  26588   uint32x4_t __s0 = __p0; \
  26589   uint32x4_t __s1 = __p1; \
  26590   __ret = (uint32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \
  26591   __ret; \
  26592 })
  26593 #else
  /* vrsraq_n_u32 (big-endian build): as above, except both vector operands
   * are lane-reversed (3, 2, 1, 0) before the builtin call and the result
   * is lane-reversed again before being yielded. */
  26594 #define vrsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  26595   uint32x4_t __ret; \
  26596   uint32x4_t __s0 = __p0; \
  26597   uint32x4_t __s1 = __p1; \
  26598   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26599   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  26600   __ret = (uint32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \
  26601   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26602   __ret; \
  26603 })
  26604 #endif
  26605 
  26606 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_u64 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into uint64x2_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 51) cast to
   * uint64x2_t. __p2 is pasted textually into the builtin call. */
  26607 #define vrsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  26608   uint64x2_t __ret; \
  26609   uint64x2_t __s0 = __p0; \
  26610   uint64x2_t __s1 = __p1; \
  26611   __ret = (uint64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
  26612   __ret; \
  26613 })
  26614 #else
  /* vrsraq_n_u64 (big-endian build): as above, except both vector operands
   * have their two lanes swapped (1, 0) before the builtin call and the
   * result is swapped back before being yielded. */
  26615 #define vrsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  26616   uint64x2_t __ret; \
  26617   uint64x2_t __s0 = __p0; \
  26618   uint64x2_t __s1 = __p1; \
  26619   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26620   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  26621   __ret = (uint64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
  26622   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26623   __ret; \
  26624 })
  26625 #endif
  26626 
  26627 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_u16 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into uint16x8_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 49) cast to
   * uint16x8_t. __p2 is pasted textually into the builtin call. */
  26628 #define vrsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  26629   uint16x8_t __ret; \
  26630   uint16x8_t __s0 = __p0; \
  26631   uint16x8_t __s1 = __p1; \
  26632   __ret = (uint16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \
  26633   __ret; \
  26634 })
  26635 #else
  /* vrsraq_n_u16 (big-endian build): as above, except both vector operands
   * are lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26636 #define vrsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  26637   uint16x8_t __ret; \
  26638   uint16x8_t __s0 = __p0; \
  26639   uint16x8_t __s1 = __p1; \
  26640   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26641   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  26642   __ret = (uint16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
  26643   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26644   __ret; \
  26645 })
  26646 #endif
  26647 
  26648 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_s8 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into int8x16_t temporaries, then the macro
   * yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 32) cast to
   * int8x16_t. __p2 is pasted textually into the builtin call. */
  26649 #define vrsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  26650   int8x16_t __ret; \
  26651   int8x16_t __s0 = __p0; \
  26652   int8x16_t __s1 = __p1; \
  26653   __ret = (int8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  26654   __ret; \
  26655 })
  26656 #else
  /* vrsraq_n_s8 (big-endian build): as above, except both vector operands
   * are lane-reversed (15 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26657 #define vrsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  26658   int8x16_t __ret; \
  26659   int8x16_t __s0 = __p0; \
  26660   int8x16_t __s1 = __p1; \
  26661   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26662   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26663   __ret = (int8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  26664   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  26665   __ret; \
  26666 })
  26667 #endif
  26668 
  26669 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_s32 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into int32x4_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 34) cast to
   * int32x4_t. __p2 is pasted textually into the builtin call. */
  26670 #define vrsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  26671   int32x4_t __ret; \
  26672   int32x4_t __s0 = __p0; \
  26673   int32x4_t __s1 = __p1; \
  26674   __ret = (int32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  26675   __ret; \
  26676 })
  26677 #else
  /* vrsraq_n_s32 (big-endian build): as above, except both vector operands
   * are lane-reversed (3, 2, 1, 0) before the builtin call and the result
   * is lane-reversed again before being yielded. */
  26678 #define vrsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  26679   int32x4_t __ret; \
  26680   int32x4_t __s0 = __p0; \
  26681   int32x4_t __s1 = __p1; \
  26682   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26683   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  26684   __ret = (int32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
  26685   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26686   __ret; \
  26687 })
  26688 #endif
  26689 
  26690 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_s64 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into int64x2_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 35) cast to
   * int64x2_t. __p2 is pasted textually into the builtin call. */
  26691 #define vrsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  26692   int64x2_t __ret; \
  26693   int64x2_t __s0 = __p0; \
  26694   int64x2_t __s1 = __p1; \
  26695   __ret = (int64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \
  26696   __ret; \
  26697 })
  26698 #else
  /* vrsraq_n_s64 (big-endian build): as above, except both vector operands
   * have their two lanes swapped (1, 0) before the builtin call and the
   * result is swapped back before being yielded. */
  26699 #define vrsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  26700   int64x2_t __ret; \
  26701   int64x2_t __s0 = __p0; \
  26702   int64x2_t __s1 = __p1; \
  26703   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26704   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  26705   __ret = (int64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \
  26706   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26707   __ret; \
  26708 })
  26709 #endif
  26710 
  26711 #ifdef __LITTLE_ENDIAN__
  /* vrsraq_n_s16 (little-endian build): statement-expression macro. __p0
   * and __p1 are each copied once into int16x8_t temporaries, then the
   * macro yields __builtin_neon_vrsraq_n_v(__s0, __s1, __p2, 33) cast to
   * int16x8_t. __p2 is pasted textually into the builtin call. */
  26712 #define vrsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  26713   int16x8_t __ret; \
  26714   int16x8_t __s0 = __p0; \
  26715   int16x8_t __s1 = __p1; \
  26716   __ret = (int16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  26717   __ret; \
  26718 })
  26719 #else
  /* vrsraq_n_s16 (big-endian build): as above, except both vector operands
   * are lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26720 #define vrsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  26721   int16x8_t __ret; \
  26722   int16x8_t __s0 = __p0; \
  26723   int16x8_t __s1 = __p1; \
  26724   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26725   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  26726   __ret = (int16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  26727   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26728   __ret; \
  26729 })
  26730 #endif
  26731 
  26732 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_u8 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into uint8x8_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 16) cast to
   * uint8x8_t. __p2 is pasted textually into the builtin call. */
  26733 #define vrsra_n_u8(__p0, __p1, __p2) __extension__ ({ \
  26734   uint8x8_t __ret; \
  26735   uint8x8_t __s0 = __p0; \
  26736   uint8x8_t __s1 = __p1; \
  26737   __ret = (uint8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \
  26738   __ret; \
  26739 })
  26740 #else
  /* vrsra_n_u8 (big-endian build): as above, except both vector operands
   * are lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26741 #define vrsra_n_u8(__p0, __p1, __p2) __extension__ ({ \
  26742   uint8x8_t __ret; \
  26743   uint8x8_t __s0 = __p0; \
  26744   uint8x8_t __s1 = __p1; \
  26745   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26746   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  26747   __ret = (uint8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \
  26748   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26749   __ret; \
  26750 })
  26751 #endif
  26752 
  26753 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_u32 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into uint32x2_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 18) cast to
   * uint32x2_t. __p2 is pasted textually into the builtin call. */
  26754 #define vrsra_n_u32(__p0, __p1, __p2) __extension__ ({ \
  26755   uint32x2_t __ret; \
  26756   uint32x2_t __s0 = __p0; \
  26757   uint32x2_t __s1 = __p1; \
  26758   __ret = (uint32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \
  26759   __ret; \
  26760 })
  26761 #else
  /* vrsra_n_u32 (big-endian build): as above, except both vector operands
   * have their two lanes swapped (1, 0) before the builtin call and the
   * result is swapped back before being yielded. */
  26762 #define vrsra_n_u32(__p0, __p1, __p2) __extension__ ({ \
  26763   uint32x2_t __ret; \
  26764   uint32x2_t __s0 = __p0; \
  26765   uint32x2_t __s1 = __p1; \
  26766   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26767   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  26768   __ret = (uint32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \
  26769   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26770   __ret; \
  26771 })
  26772 #endif
  26773 
  /* vrsra_n_u64: statement-expression macro with a single definition that is
   * not guarded by __LITTLE_ENDIAN__ and performs no lane shuffle. __p0 and
   * __p1 are each copied once into uint64x1_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 19) cast to
   * uint64x1_t. __p2 is pasted textually into the builtin call. */
  26774 #define vrsra_n_u64(__p0, __p1, __p2) __extension__ ({ \
  26775   uint64x1_t __ret; \
  26776   uint64x1_t __s0 = __p0; \
  26777   uint64x1_t __s1 = __p1; \
  26778   __ret = (uint64x1_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \
  26779   __ret; \
  26780 })
  26781 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_u16 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into uint16x4_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 17) cast to
   * uint16x4_t. __p2 is pasted textually into the builtin call. */
  26782 #define vrsra_n_u16(__p0, __p1, __p2) __extension__ ({ \
  26783   uint16x4_t __ret; \
  26784   uint16x4_t __s0 = __p0; \
  26785   uint16x4_t __s1 = __p1; \
  26786   __ret = (uint16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \
  26787   __ret; \
  26788 })
  26789 #else
  /* vrsra_n_u16 (big-endian build): as above, except both vector operands
   * are lane-reversed (3, 2, 1, 0) before the builtin call and the result
   * is lane-reversed again before being yielded. */
  26790 #define vrsra_n_u16(__p0, __p1, __p2) __extension__ ({ \
  26791   uint16x4_t __ret; \
  26792   uint16x4_t __s0 = __p0; \
  26793   uint16x4_t __s1 = __p1; \
  26794   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26795   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  26796   __ret = (uint16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \
  26797   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26798   __ret; \
  26799 })
  26800 #endif
  26801 
  26802 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_s8 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into int8x8_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 0) cast to int8x8_t.
   * __p2 is pasted textually into the builtin call. */
  26803 #define vrsra_n_s8(__p0, __p1, __p2) __extension__ ({ \
  26804   int8x8_t __ret; \
  26805   int8x8_t __s0 = __p0; \
  26806   int8x8_t __s1 = __p1; \
  26807   __ret = (int8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \
  26808   __ret; \
  26809 })
  26810 #else
  /* vrsra_n_s8 (big-endian build): as above, except both vector operands
   * are lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded. */
  26811 #define vrsra_n_s8(__p0, __p1, __p2) __extension__ ({ \
  26812   int8x8_t __ret; \
  26813   int8x8_t __s0 = __p0; \
  26814   int8x8_t __s1 = __p1; \
  26815   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  26816   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  26817   __ret = (int8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \
  26818   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  26819   __ret; \
  26820 })
  26821 #endif
  26822 
  26823 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_s32 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into int32x2_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 2) cast to int32x2_t.
   * __p2 is pasted textually into the builtin call. */
  26824 #define vrsra_n_s32(__p0, __p1, __p2) __extension__ ({ \
  26825   int32x2_t __ret; \
  26826   int32x2_t __s0 = __p0; \
  26827   int32x2_t __s1 = __p1; \
  26828   __ret = (int32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  26829   __ret; \
  26830 })
  26831 #else
  /* vrsra_n_s32 (big-endian build): as above, except both vector operands
   * have their two lanes swapped (1, 0) before the builtin call and the
   * result is swapped back before being yielded. */
  26832 #define vrsra_n_s32(__p0, __p1, __p2) __extension__ ({ \
  26833   int32x2_t __ret; \
  26834   int32x2_t __s0 = __p0; \
  26835   int32x2_t __s1 = __p1; \
  26836   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  26837   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  26838   __ret = (int32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  26839   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  26840   __ret; \
  26841 })
  26842 #endif
  26843 
  /* vrsra_n_s64: statement-expression macro with a single definition that is
   * not guarded by __LITTLE_ENDIAN__ and performs no lane shuffle. __p0 and
   * __p1 are each copied once into int64x1_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 3) cast to int64x1_t.
   * __p2 is pasted textually into the builtin call. */
  26844 #define vrsra_n_s64(__p0, __p1, __p2) __extension__ ({ \
  26845   int64x1_t __ret; \
  26846   int64x1_t __s0 = __p0; \
  26847   int64x1_t __s1 = __p1; \
  26848   __ret = (int64x1_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \
  26849   __ret; \
  26850 })
  26851 #ifdef __LITTLE_ENDIAN__
  /* vrsra_n_s16 (little-endian build): statement-expression macro. __p0 and
   * __p1 are each copied once into int16x4_t temporaries, then the macro
   * yields __builtin_neon_vrsra_n_v(__s0, __s1, __p2, 1) cast to int16x4_t.
   * __p2 is pasted textually into the builtin call. */
  26852 #define vrsra_n_s16(__p0, __p1, __p2) __extension__ ({ \
  26853   int16x4_t __ret; \
  26854   int16x4_t __s0 = __p0; \
  26855   int16x4_t __s1 = __p1; \
  26856   __ret = (int16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  26857   __ret; \
  26858 })
  26859 #else
  /* vrsra_n_s16 (big-endian build): as above, except both vector operands
   * are lane-reversed (3, 2, 1, 0) before the builtin call and the result
   * is lane-reversed again before being yielded. */
  26860 #define vrsra_n_s16(__p0, __p1, __p2) __extension__ ({ \
  26861   int16x4_t __ret; \
  26862   int16x4_t __s0 = __p0; \
  26863   int16x4_t __s1 = __p1; \
  26864   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  26865   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  26866   __ret = (int16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  26867   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  26868   __ret; \
  26869 })
  26870 #endif
  26871 
  26872 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_u32 (little-endian build): passes two uint32x4_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 17 and returns the result cast to uint16x4_t.
   * NOTE(review): the name suggests the ACLE rounding subtract with
   * high-half narrowing; the arithmetic is inside the builtin. */
  26873 __ai __attribute__((target("neon"))) uint16x4_t vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  26874   uint16x4_t __ret;
  26875   __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  26876   return __ret;
  26877 }
  26878 #else
  /* vrsubhn_u32 (big-endian build): same builtin call, but both operands
   * are lane-reversed (3, 2, 1, 0) first and the uint16x4_t result is
   * lane-reversed (3, 2, 1, 0) before returning. */
  26879 __ai __attribute__((target("neon"))) uint16x4_t vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  26880   uint16x4_t __ret;
  26881   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26882   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  26883   __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17);
  26884   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26885   return __ret;
  26886 }
  /* __noswap_vrsubhn_u32: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26887 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  26888   uint16x4_t __ret;
  26889   __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  26890   return __ret;
  26891 }
  26892 #endif
  26893 
  26894 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_u64 (little-endian build): passes two uint64x2_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 18 and returns the result cast to uint32x2_t. */
  26895 __ai __attribute__((target("neon"))) uint32x2_t vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  26896   uint32x2_t __ret;
  26897   __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  26898   return __ret;
  26899 }
  26900 #else
  /* vrsubhn_u64 (big-endian build): same builtin call, but both operands
   * have their two lanes swapped (1, 0) first and the uint32x2_t result is
   * swapped (1, 0) before returning. */
  26901 __ai __attribute__((target("neon"))) uint32x2_t vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  26902   uint32x2_t __ret;
  26903   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26904   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  26905   __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18);
  26906   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26907   return __ret;
  26908 }
  /* __noswap_vrsubhn_u64: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26909 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  26910   uint32x2_t __ret;
  26911   __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  26912   return __ret;
  26913 }
  26914 #endif
  26915 
  26916 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_u16 (little-endian build): passes two uint16x8_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 16 and returns the result cast to uint8x8_t. */
  26917 __ai __attribute__((target("neon"))) uint8x8_t vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  26918   uint8x8_t __ret;
  26919   __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  26920   return __ret;
  26921 }
  26922 #else
  /* vrsubhn_u16 (big-endian build): same builtin call, but both operands
   * are lane-reversed (7 ... 0) first and the uint8x8_t result is
   * lane-reversed (7 ... 0) before returning. */
  26923 __ai __attribute__((target("neon"))) uint8x8_t vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  26924   uint8x8_t __ret;
  26925   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  26926   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  26927   __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16);
  26928   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  26929   return __ret;
  26930 }
  /* __noswap_vrsubhn_u16: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26931 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  26932   uint8x8_t __ret;
  26933   __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  26934   return __ret;
  26935 }
  26936 #endif
  26937 
  26938 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_s32 (little-endian build): passes two int32x4_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 1 and returns the result cast to int16x4_t. */
  26939 __ai __attribute__((target("neon"))) int16x4_t vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  26940   int16x4_t __ret;
  26941   __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  26942   return __ret;
  26943 }
  26944 #else
  /* vrsubhn_s32 (big-endian build): same builtin call, but both operands
   * are lane-reversed (3, 2, 1, 0) first and the int16x4_t result is
   * lane-reversed (3, 2, 1, 0) before returning. */
  26945 __ai __attribute__((target("neon"))) int16x4_t vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  26946   int16x4_t __ret;
  26947   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  26948   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  26949   __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1);
  26950   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  26951   return __ret;
  26952 }
  /* __noswap_vrsubhn_s32: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26953 __ai __attribute__((target("neon"))) int16x4_t __noswap_vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  26954   int16x4_t __ret;
  26955   __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  26956   return __ret;
  26957 }
  26958 #endif
  26959 
  26960 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_s64 (little-endian build): passes two int64x2_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 2 and returns the result cast to int32x2_t. */
  26961 __ai __attribute__((target("neon"))) int32x2_t vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  26962   int32x2_t __ret;
  26963   __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  26964   return __ret;
  26965 }
  26966 #else
  /* vrsubhn_s64 (big-endian build): same builtin call, but both operands
   * have their two lanes swapped (1, 0) first and the int32x2_t result is
   * swapped (1, 0) before returning. */
  26967 __ai __attribute__((target("neon"))) int32x2_t vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  26968   int32x2_t __ret;
  26969   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  26970   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  26971   __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2);
  26972   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  26973   return __ret;
  26974 }
  /* __noswap_vrsubhn_s64: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26975 __ai __attribute__((target("neon"))) int32x2_t __noswap_vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  26976   int32x2_t __ret;
  26977   __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  26978   return __ret;
  26979 }
  26980 #endif
  26981 
  26982 #ifdef __LITTLE_ENDIAN__
  /* vrsubhn_s16 (little-endian build): passes two int16x8_t operands,
   * reinterpreted as int8x16_t, to __builtin_neon_vrsubhn_v with final
   * argument 0 and returns the result cast to int8x8_t. */
  26983 __ai __attribute__((target("neon"))) int8x8_t vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  26984   int8x8_t __ret;
  26985   __ret = (int8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  26986   return __ret;
  26987 }
  26988 #else
  /* vrsubhn_s16 (big-endian build): same builtin call, but both operands
   * are lane-reversed (7 ... 0) first and the int8x8_t result is
   * lane-reversed (7 ... 0) before returning. */
  26989 __ai __attribute__((target("neon"))) int8x8_t vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  26990   int8x8_t __ret;
  26991   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  26992   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  26993   __ret = (int8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0);
  26994   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  26995   return __ret;
  26996 }
  /* __noswap_vrsubhn_s16: defined only in the big-endian branch; its body is
   * the same as the little-endian definition, i.e. no lane reversal.
   * NOTE(review): presumably used by other intrinsics whose operands are
   * already reversed - the callers are outside this chunk. */
  26997 __ai __attribute__((target("neon"))) int8x8_t __noswap_vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  26998   int8x8_t __ret;
  26999   __ret = (int8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  27000   return __ret;
  27001 }
  27002 #endif
  27003 
  27004 #ifdef __LITTLE_ENDIAN__
  /* vset_lane_p8 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a poly8_t and the vector __p1 into a poly8x8_t
   * (each evaluated once), then yields
   * __builtin_neon_vset_lane_i8(__s0, __s1, __p2) cast to poly8x8_t.
   * __p2 is pasted textually into the builtin call.
   * NOTE(review): presumably __p2 is a constant lane index - confirm against
   * the ACLE specification. */
  27005 #define vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27006   poly8x8_t __ret; \
  27007   poly8_t __s0 = __p0; \
  27008   poly8x8_t __s1 = __p1; \
  27009   __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__s1, __p2); \
  27010   __ret; \
  27011 })
  27012 #else
  /* vset_lane_p8 (big-endian build): as above, except the vector operand is
   * lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27013 #define vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27014   poly8x8_t __ret; \
  27015   poly8_t __s0 = __p0; \
  27016   poly8x8_t __s1 = __p1; \
  27017   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27018   __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__rev1, __p2); \
  27019   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27020   __ret; \
  27021 })
  /* __noswap_vset_lane_p8: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27022 #define __noswap_vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27023   poly8x8_t __ret; \
  27024   poly8_t __s0 = __p0; \
  27025   poly8x8_t __s1 = __p1; \
  27026   __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__s1, __p2); \
  27027   __ret; \
  27028 })
  27029 #endif
  27030 
  27031 #ifdef __LITTLE_ENDIAN__
  /* vset_lane_p16 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a poly16_t and the vector __p1 into a poly16x4_t
   * (each evaluated once), then yields
   * __builtin_neon_vset_lane_i16(__s0, __s1, __p2) cast to poly16x4_t.
   * __p2 is pasted textually into the builtin call. */
  27032 #define vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27033   poly16x4_t __ret; \
  27034   poly16_t __s0 = __p0; \
  27035   poly16x4_t __s1 = __p1; \
  27036   __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__s1, __p2); \
  27037   __ret; \
  27038 })
  27039 #else
  /* vset_lane_p16 (big-endian build): as above, except the vector operand is
   * lane-reversed (3, 2, 1, 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27040 #define vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27041   poly16x4_t __ret; \
  27042   poly16_t __s0 = __p0; \
  27043   poly16x4_t __s1 = __p1; \
  27044   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27045   __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__rev1, __p2); \
  27046   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27047   __ret; \
  27048 })
  /* __noswap_vset_lane_p16: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27049 #define __noswap_vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27050   poly16x4_t __ret; \
  27051   poly16_t __s0 = __p0; \
  27052   poly16x4_t __s1 = __p1; \
  27053   __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__s1, __p2); \
  27054   __ret; \
  27055 })
  27056 #endif
  27057 
  27058 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_p8 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a poly8_t and the vector __p1 into a poly8x16_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i8(__s0, __s1, __p2) cast to poly8x16_t.
   * __p2 is pasted textually into the builtin call. */
  27059 #define vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27060   poly8x16_t __ret; \
  27061   poly8_t __s0 = __p0; \
  27062   poly8x16_t __s1 = __p1; \
  27063   __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__s1, __p2); \
  27064   __ret; \
  27065 })
  27066 #else
  /* vsetq_lane_p8 (big-endian build): as above, except the vector operand is
   * lane-reversed (15 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27067 #define vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27068   poly8x16_t __ret; \
  27069   poly8_t __s0 = __p0; \
  27070   poly8x16_t __s1 = __p1; \
  27071   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27072   __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__rev1, __p2); \
  27073   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27074   __ret; \
  27075 })
  /* __noswap_vsetq_lane_p8: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27076 #define __noswap_vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  27077   poly8x16_t __ret; \
  27078   poly8_t __s0 = __p0; \
  27079   poly8x16_t __s1 = __p1; \
  27080   __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__s1, __p2); \
  27081   __ret; \
  27082 })
  27083 #endif
  27084 
  27085 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_p16 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a poly16_t and the vector __p1 into a poly16x8_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i16(__s0, __s1, __p2) cast to poly16x8_t.
   * __p2 is pasted textually into the builtin call. */
  27086 #define vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27087   poly16x8_t __ret; \
  27088   poly16_t __s0 = __p0; \
  27089   poly16x8_t __s1 = __p1; \
  27090   __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__s1, __p2); \
  27091   __ret; \
  27092 })
  27093 #else
  /* vsetq_lane_p16 (big-endian build): as above, except the vector operand
   * is lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27094 #define vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27095   poly16x8_t __ret; \
  27096   poly16_t __s0 = __p0; \
  27097   poly16x8_t __s1 = __p1; \
  27098   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27099   __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__rev1, __p2); \
  27100   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27101   __ret; \
  27102 })
  /* __noswap_vsetq_lane_p16: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27103 #define __noswap_vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  27104   poly16x8_t __ret; \
  27105   poly16_t __s0 = __p0; \
  27106   poly16x8_t __s1 = __p1; \
  27107   __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__s1, __p2); \
  27108   __ret; \
  27109 })
  27110 #endif
  27111 
  27112 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_u8 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a uint8_t and the vector __p1 into a uint8x16_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2) cast to
   * uint8x16_t. __p2 is pasted textually into the builtin call. */
  27113 #define vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27114   uint8x16_t __ret; \
  27115   uint8_t __s0 = __p0; \
  27116   uint8x16_t __s1 = __p1; \
  27117   __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \
  27118   __ret; \
  27119 })
  27120 #else
  /* vsetq_lane_u8 (big-endian build): as above, except the vector operand is
   * lane-reversed (15 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27121 #define vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27122   uint8x16_t __ret; \
  27123   uint8_t __s0 = __p0; \
  27124   uint8x16_t __s1 = __p1; \
  27125   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27126   __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__rev1, __p2); \
  27127   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27128   __ret; \
  27129 })
  /* __noswap_vsetq_lane_u8: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27130 #define __noswap_vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27131   uint8x16_t __ret; \
  27132   uint8_t __s0 = __p0; \
  27133   uint8x16_t __s1 = __p1; \
  27134   __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \
  27135   __ret; \
  27136 })
  27137 #endif
  27138 
  27139 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_u32 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a uint32_t and the vector __p1 into a uint32x4_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2) cast to
   * uint32x4_t. __p2 is pasted textually into the builtin call. */
  27140 #define vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27141   uint32x4_t __ret; \
  27142   uint32_t __s0 = __p0; \
  27143   uint32x4_t __s1 = __p1; \
  27144   __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \
  27145   __ret; \
  27146 })
  27147 #else
  /* vsetq_lane_u32 (big-endian build): as above, except the vector operand
   * is lane-reversed (3, 2, 1, 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27148 #define vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27149   uint32x4_t __ret; \
  27150   uint32_t __s0 = __p0; \
  27151   uint32x4_t __s1 = __p1; \
  27152   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27153   __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__rev1, __p2); \
  27154   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27155   __ret; \
  27156 })
  /* __noswap_vsetq_lane_u32: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27157 #define __noswap_vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27158   uint32x4_t __ret; \
  27159   uint32_t __s0 = __p0; \
  27160   uint32x4_t __s1 = __p1; \
  27161   __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \
  27162   __ret; \
  27163 })
  27164 #endif
  27165 
  27166 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_u64 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a uint64_t and the vector __p1 into a uint64x2_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2) cast to
   * uint64x2_t. __p2 is pasted textually into the builtin call. */
  27167 #define vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  27168   uint64x2_t __ret; \
  27169   uint64_t __s0 = __p0; \
  27170   uint64x2_t __s1 = __p1; \
  27171   __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \
  27172   __ret; \
  27173 })
  27174 #else
  /* vsetq_lane_u64 (big-endian build): as above, except the vector operand
   * has its two lanes swapped (1, 0) before the builtin call and the result
   * is swapped back before being yielded; __p2 is passed unchanged. */
  27175 #define vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  27176   uint64x2_t __ret; \
  27177   uint64_t __s0 = __p0; \
  27178   uint64x2_t __s1 = __p1; \
  27179   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  27180   __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__rev1, __p2); \
  27181   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27182   __ret; \
  27183 })
  /* __noswap_vsetq_lane_u64: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27184 #define __noswap_vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  27185   uint64x2_t __ret; \
  27186   uint64_t __s0 = __p0; \
  27187   uint64x2_t __s1 = __p1; \
  27188   __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \
  27189   __ret; \
  27190 })
  27191 #endif
  27192 
  27193 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_u16 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into a uint16_t and the vector __p1 into a uint16x8_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2) cast to
   * uint16x8_t. __p2 is pasted textually into the builtin call. */
  27194 #define vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27195   uint16x8_t __ret; \
  27196   uint16_t __s0 = __p0; \
  27197   uint16x8_t __s1 = __p1; \
  27198   __ret = (uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \
  27199   __ret; \
  27200 })
  27201 #else
  /* vsetq_lane_u16 (big-endian build): as above, except the vector operand
   * is lane-reversed (7 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27202 #define vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27203   uint16x8_t __ret; \
  27204   uint16_t __s0 = __p0; \
  27205   uint16x8_t __s1 = __p1; \
  27206   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27207   __ret = (uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__rev1, __p2); \
  27208   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27209   __ret; \
  27210 })
  /* __noswap_vsetq_lane_u16: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27211 #define __noswap_vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27212   uint16x8_t __ret; \
  27213   uint16_t __s0 = __p0; \
  27214   uint16x8_t __s1 = __p1; \
  27215   __ret = (uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \
  27216   __ret; \
  27217 })
  27218 #endif
  27219 
  27220 #ifdef __LITTLE_ENDIAN__
  /* vsetq_lane_s8 (little-endian build): statement-expression macro. Copies
   * the scalar __p0 into an int8_t and the vector __p1 into an int8x16_t
   * (each evaluated once), then yields
   * __builtin_neon_vsetq_lane_i8(__s0, __s1, __p2) cast to int8x16_t.
   * __p2 is pasted textually into the builtin call. */
  27221 #define vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27222   int8x16_t __ret; \
  27223   int8_t __s0 = __p0; \
  27224   int8x16_t __s1 = __p1; \
  27225   __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \
  27226   __ret; \
  27227 })
  27228 #else
  /* vsetq_lane_s8 (big-endian build): as above, except the vector operand is
   * lane-reversed (15 ... 0) before the builtin call and the result is
   * lane-reversed again before being yielded; __p2 is passed unchanged. */
  27229 #define vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27230   int8x16_t __ret; \
  27231   int8_t __s0 = __p0; \
  27232   int8x16_t __s1 = __p1; \
  27233   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27234   __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__rev1, __p2); \
  27235   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27236   __ret; \
  27237 })
  /* __noswap_vsetq_lane_s8: defined only in the big-endian branch; its body
   * matches the little-endian macro, i.e. no lane reversal is applied. */
  27238 #define __noswap_vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27239   int8x16_t __ret; \
  27240   int8_t __s0 = __p0; \
  27241   int8x16_t __s1 = __p1; \
  27242   __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \
  27243   __ret; \
  27244 })
  27245 #endif
  27246 
  27247 #ifdef __LITTLE_ENDIAN__
        /* vsetq_lane_f32(__p0, __p1, __p2): copies the scalar __p0 into a float32_t
         * local and the vector __p1 into a float32x4_t local, then calls
         * __builtin_neon_vsetq_lane_f32 with lane index __p2 and yields the result
         * as float32x4_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27248 #define vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27249   float32x4_t __ret; \
  27250   float32_t __s0 = __p0; \
  27251   float32x4_t __s1 = __p1; \
  27252   __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__s1, __p2); \
  27253   __ret; \
  27254 })
  27255 #else
        /* Big-endian form: the four lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27256 #define vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27257   float32x4_t __ret; \
  27258   float32_t __s0 = __p0; \
  27259   float32x4_t __s1 = __p1; \
  27260   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27261   __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__rev1, __p2); \
  27262   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27263   __ret; \
  27264 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27265 #define __noswap_vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27266   float32x4_t __ret; \
  27267   float32_t __s0 = __p0; \
  27268   float32x4_t __s1 = __p1; \
  27269   __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__s1, __p2); \
  27270   __ret; \
  27271 })
  27272 #endif
  27273 
  27274 #ifdef __LITTLE_ENDIAN__
        /* vsetq_lane_s32(__p0, __p1, __p2): copies the scalar __p0 into an int32_t
         * local and the vector __p1 into an int32x4_t local, then calls
         * __builtin_neon_vsetq_lane_i32 with lane index __p2 and yields the result
         * as int32x4_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27275 #define vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27276   int32x4_t __ret; \
  27277   int32_t __s0 = __p0; \
  27278   int32x4_t __s1 = __p1; \
  27279   __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \
  27280   __ret; \
  27281 })
  27282 #else
        /* Big-endian form: the four lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27283 #define vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27284   int32x4_t __ret; \
  27285   int32_t __s0 = __p0; \
  27286   int32x4_t __s1 = __p1; \
  27287   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27288   __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__rev1, __p2); \
  27289   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27290   __ret; \
  27291 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27292 #define __noswap_vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27293   int32x4_t __ret; \
  27294   int32_t __s0 = __p0; \
  27295   int32x4_t __s1 = __p1; \
  27296   __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \
  27297   __ret; \
  27298 })
  27299 #endif
  27300 
  27301 #ifdef __LITTLE_ENDIAN__
        /* vsetq_lane_s64(__p0, __p1, __p2): copies the scalar __p0 into an int64_t
         * local and the vector __p1 into an int64x2_t local, then calls
         * __builtin_neon_vsetq_lane_i64 with lane index __p2 and yields the result
         * as int64x2_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27302 #define vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  27303   int64x2_t __ret; \
  27304   int64_t __s0 = __p0; \
  27305   int64x2_t __s1 = __p1; \
  27306   __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \
  27307   __ret; \
  27308 })
  27309 #else
        /* Big-endian form: the two lanes of __p1 are swapped before the builtin
         * call and the result is swapped back. */
  27310 #define vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  27311   int64x2_t __ret; \
  27312   int64_t __s0 = __p0; \
  27313   int64x2_t __s1 = __p1; \
  27314   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  27315   __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__rev1, __p2); \
  27316   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27317   __ret; \
  27318 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * swaps. NOTE(review): presumably used by other intrinsics in this header
         * that already hold reversed operands - confirm. */
  27319 #define __noswap_vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  27320   int64x2_t __ret; \
  27321   int64_t __s0 = __p0; \
  27322   int64x2_t __s1 = __p1; \
  27323   __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \
  27324   __ret; \
  27325 })
  27326 #endif
  27327 
  27328 #ifdef __LITTLE_ENDIAN__
        /* vsetq_lane_s16(__p0, __p1, __p2): copies the scalar __p0 into an int16_t
         * local and the vector __p1 into an int16x8_t local, then calls
         * __builtin_neon_vsetq_lane_i16 with lane index __p2 and yields the result
         * as int16x8_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27329 #define vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27330   int16x8_t __ret; \
  27331   int16_t __s0 = __p0; \
  27332   int16x8_t __s1 = __p1; \
  27333   __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \
  27334   __ret; \
  27335 })
  27336 #else
        /* Big-endian form: the eight lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27337 #define vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27338   int16x8_t __ret; \
  27339   int16_t __s0 = __p0; \
  27340   int16x8_t __s1 = __p1; \
  27341   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27342   __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__rev1, __p2); \
  27343   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27344   __ret; \
  27345 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27346 #define __noswap_vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27347   int16x8_t __ret; \
  27348   int16_t __s0 = __p0; \
  27349   int16x8_t __s1 = __p1; \
  27350   __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \
  27351   __ret; \
  27352 })
  27353 #endif
  27354 
  27355 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_u8(__p0, __p1, __p2): copies the scalar __p0 into a uint8_t
         * local and the vector __p1 into a uint8x8_t local, then calls
         * __builtin_neon_vset_lane_i8 (vector cast to int8x8_t) with lane index
         * __p2 and yields the result as uint8x8_t. Per the ACLE this is __p1 with
         * lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27356 #define vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27357   uint8x8_t __ret; \
  27358   uint8_t __s0 = __p0; \
  27359   uint8x8_t __s1 = __p1; \
  27360   __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \
  27361   __ret; \
  27362 })
  27363 #else
        /* Big-endian form: the eight lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27364 #define vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27365   uint8x8_t __ret; \
  27366   uint8_t __s0 = __p0; \
  27367   uint8x8_t __s1 = __p1; \
  27368   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27369   __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__rev1, __p2); \
  27370   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27371   __ret; \
  27372 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27373 #define __noswap_vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  27374   uint8x8_t __ret; \
  27375   uint8_t __s0 = __p0; \
  27376   uint8x8_t __s1 = __p1; \
  27377   __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \
  27378   __ret; \
  27379 })
  27380 #endif
  27381 
  27382 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_u32(__p0, __p1, __p2): copies the scalar __p0 into a uint32_t
         * local and the vector __p1 into a uint32x2_t local, then calls
         * __builtin_neon_vset_lane_i32 (vector cast to int32x2_t) with lane index
         * __p2 and yields the result as uint32x2_t. Per the ACLE this is __p1 with
         * lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27383 #define vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27384   uint32x2_t __ret; \
  27385   uint32_t __s0 = __p0; \
  27386   uint32x2_t __s1 = __p1; \
  27387   __ret = (uint32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \
  27388   __ret; \
  27389 })
  27390 #else
        /* Big-endian form: the two lanes of __p1 are swapped before the builtin
         * call and the result is swapped back. */
  27391 #define vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27392   uint32x2_t __ret; \
  27393   uint32_t __s0 = __p0; \
  27394   uint32x2_t __s1 = __p1; \
  27395   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  27396   __ret = (uint32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__rev1, __p2); \
  27397   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27398   __ret; \
  27399 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * swaps. NOTE(review): presumably used by other intrinsics in this header
         * that already hold reversed operands - confirm. */
  27400 #define __noswap_vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  27401   uint32x2_t __ret; \
  27402   uint32_t __s0 = __p0; \
  27403   uint32x2_t __s1 = __p1; \
  27404   __ret = (uint32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \
  27405   __ret; \
  27406 })
  27407 #endif
  27408 
  /* vset_lane_u64(__p0, __p1, __p2): copies the scalar __p0 into a uint64_t local
   * and the vector __p1 into a uint64x1_t local, then calls
   * __builtin_neon_vset_lane_i64 (vector cast to int64x1_t) with lane index __p2
   * and yields the result as uint64x1_t. Per the ACLE this is __p1 with lane
   * __p2 replaced by __p0. Defined once, outside any __LITTLE_ENDIAN__
   * conditional, with no lane reversal. */
  27409 #define vset_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  27410   uint64x1_t __ret; \
  27411   uint64_t __s0 = __p0; \
  27412   uint64x1_t __s1 = __p1; \
  27413   __ret = (uint64x1_t) __builtin_neon_vset_lane_i64(__s0, (int64x1_t)__s1, __p2); \
  27414   __ret; \
  27415 })
  27416 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_u16(__p0, __p1, __p2): copies the scalar __p0 into a uint16_t
         * local and the vector __p1 into a uint16x4_t local, then calls
         * __builtin_neon_vset_lane_i16 (vector cast to int16x4_t) with lane index
         * __p2 and yields the result as uint16x4_t. Per the ACLE this is __p1 with
         * lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27417 #define vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27418   uint16x4_t __ret; \
  27419   uint16_t __s0 = __p0; \
  27420   uint16x4_t __s1 = __p1; \
  27421   __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \
  27422   __ret; \
  27423 })
  27424 #else
        /* Big-endian form: the four lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27425 #define vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27426   uint16x4_t __ret; \
  27427   uint16_t __s0 = __p0; \
  27428   uint16x4_t __s1 = __p1; \
  27429   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27430   __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__rev1, __p2); \
  27431   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27432   __ret; \
  27433 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27434 #define __noswap_vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  27435   uint16x4_t __ret; \
  27436   uint16_t __s0 = __p0; \
  27437   uint16x4_t __s1 = __p1; \
  27438   __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \
  27439   __ret; \
  27440 })
  27441 #endif
  27442 
  27443 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_s8(__p0, __p1, __p2): copies the scalar __p0 into an int8_t
         * local and the vector __p1 into an int8x8_t local, then calls
         * __builtin_neon_vset_lane_i8 with lane index __p2 and yields the result
         * as int8x8_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27444 #define vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27445   int8x8_t __ret; \
  27446   int8_t __s0 = __p0; \
  27447   int8x8_t __s1 = __p1; \
  27448   __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \
  27449   __ret; \
  27450 })
  27451 #else
        /* Big-endian form: the eight lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27452 #define vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27453   int8x8_t __ret; \
  27454   int8_t __s0 = __p0; \
  27455   int8x8_t __s1 = __p1; \
  27456   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  27457   __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__rev1, __p2); \
  27458   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27459   __ret; \
  27460 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27461 #define __noswap_vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  27462   int8x8_t __ret; \
  27463   int8_t __s0 = __p0; \
  27464   int8x8_t __s1 = __p1; \
  27465   __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \
  27466   __ret; \
  27467 })
  27468 #endif
  27469 
  27470 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_f32(__p0, __p1, __p2): copies the scalar __p0 into a float32_t
         * local and the vector __p1 into a float32x2_t local, then calls
         * __builtin_neon_vset_lane_f32 with lane index __p2 and yields the result
         * as float32x2_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27471 #define vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27472   float32x2_t __ret; \
  27473   float32_t __s0 = __p0; \
  27474   float32x2_t __s1 = __p1; \
  27475   __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__s1, __p2); \
  27476   __ret; \
  27477 })
  27478 #else
        /* Big-endian form: the two lanes of __p1 are swapped before the builtin
         * call and the result is swapped back. */
  27479 #define vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27480   float32x2_t __ret; \
  27481   float32_t __s0 = __p0; \
  27482   float32x2_t __s1 = __p1; \
  27483   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  27484   __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__rev1, __p2); \
  27485   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27486   __ret; \
  27487 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * swaps. NOTE(review): presumably used by other intrinsics in this header
         * that already hold reversed operands - confirm. */
  27488 #define __noswap_vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  27489   float32x2_t __ret; \
  27490   float32_t __s0 = __p0; \
  27491   float32x2_t __s1 = __p1; \
  27492   __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__s1, __p2); \
  27493   __ret; \
  27494 })
  27495 #endif
  27496 
  27497 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_s32(__p0, __p1, __p2): copies the scalar __p0 into an int32_t
         * local and the vector __p1 into an int32x2_t local, then calls
         * __builtin_neon_vset_lane_i32 with lane index __p2 and yields the result
         * as int32x2_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27498 #define vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27499   int32x2_t __ret; \
  27500   int32_t __s0 = __p0; \
  27501   int32x2_t __s1 = __p1; \
  27502   __ret = (int32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \
  27503   __ret; \
  27504 })
  27505 #else
        /* Big-endian form: the two lanes of __p1 are swapped before the builtin
         * call and the result is swapped back. */
  27506 #define vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27507   int32x2_t __ret; \
  27508   int32_t __s0 = __p0; \
  27509   int32x2_t __s1 = __p1; \
  27510   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  27511   __ret = (int32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__rev1, __p2); \
  27512   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27513   __ret; \
  27514 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * swaps. NOTE(review): presumably used by other intrinsics in this header
         * that already hold reversed operands - confirm. */
  27515 #define __noswap_vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  27516   int32x2_t __ret; \
  27517   int32_t __s0 = __p0; \
  27518   int32x2_t __s1 = __p1; \
  27519   __ret = (int32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \
  27520   __ret; \
  27521 })
  27522 #endif
  27523 
  /* vset_lane_s64(__p0, __p1, __p2): copies the scalar __p0 into an int64_t local
   * and the vector __p1 into an int64x1_t local, then calls
   * __builtin_neon_vset_lane_i64 with lane index __p2 and yields the result as
   * int64x1_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
   * Defined once, outside any __LITTLE_ENDIAN__ conditional, with no lane
   * reversal. */
  27524 #define vset_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  27525   int64x1_t __ret; \
  27526   int64_t __s0 = __p0; \
  27527   int64x1_t __s1 = __p1; \
  27528   __ret = (int64x1_t) __builtin_neon_vset_lane_i64(__s0, (int64x1_t)__s1, __p2); \
  27529   __ret; \
  27530 })
  27531 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_s16(__p0, __p1, __p2): copies the scalar __p0 into an int16_t
         * local and the vector __p1 into an int16x4_t local, then calls
         * __builtin_neon_vset_lane_i16 with lane index __p2 and yields the result
         * as int16x4_t. Per the ACLE this is __p1 with lane __p2 replaced by __p0.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27532 #define vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27533   int16x4_t __ret; \
  27534   int16_t __s0 = __p0; \
  27535   int16x4_t __s1 = __p1; \
  27536   __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \
  27537   __ret; \
  27538 })
  27539 #else
        /* Big-endian form: the four lanes of __p1 are reversed before the builtin
         * call and the result is reversed back. */
  27540 #define vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27541   int16x4_t __ret; \
  27542   int16_t __s0 = __p0; \
  27543   int16x4_t __s1 = __p1; \
  27544   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  27545   __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__rev1, __p2); \
  27546   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27547   __ret; \
  27548 })
        /* __noswap_ form (big-endian builds only): same call without the lane
         * reversals. NOTE(review): presumably used by other intrinsics in this
         * header that already hold reversed operands - confirm. */
  27549 #define __noswap_vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  27550   int16x4_t __ret; \
  27551   int16_t __s0 = __p0; \
  27552   int16x4_t __s1 = __p1; \
  27553   __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \
  27554   __ret; \
  27555 })
  27556 #endif
  27557 
  27558 #ifdef __LITTLE_ENDIAN__
        /* vshlq_u8: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 48, and returns the result as
         * uint8x16_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 48 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 8-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27559 __ai __attribute__((target("neon"))) uint8x16_t vshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  27560   uint8x16_t __ret;
  27561   __ret = (uint8x16_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  27562   return __ret;
  27563 }
  27564 #else
        /* Big-endian form: both operands have their sixteen lanes reversed before
         * the call, and the result is reversed back. */
  27565 __ai __attribute__((target("neon"))) uint8x16_t vshlq_u8(uint8x16_t __p0, int8x16_t __p1) {
  27566   uint8x16_t __ret;
  27567   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27568   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27569   __ret = (uint8x16_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  27570   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27571   return __ret;
  27572 }
  27573 #endif
  27574 
  27575 #ifdef __LITTLE_ENDIAN__
        /* vshlq_u32: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 50, and returns the result as
         * uint32x4_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 50 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 32-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27576 __ai __attribute__((target("neon"))) uint32x4_t vshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  27577   uint32x4_t __ret;
  27578   __ret = (uint32x4_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  27579   return __ret;
  27580 }
  27581 #else
        /* Big-endian form: both operands have their four lanes reversed before the
         * call, and the result is reversed back. */
  27582 __ai __attribute__((target("neon"))) uint32x4_t vshlq_u32(uint32x4_t __p0, int32x4_t __p1) {
  27583   uint32x4_t __ret;
  27584   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  27585   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  27586   __ret = (uint32x4_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  27587   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  27588   return __ret;
  27589 }
  27590 #endif
  27591 
  27592 #ifdef __LITTLE_ENDIAN__
        /* vshlq_u64: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 51, and returns the result as
         * uint64x2_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 51 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 64-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27593 __ai __attribute__((target("neon"))) uint64x2_t vshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  27594   uint64x2_t __ret;
  27595   __ret = (uint64x2_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  27596   return __ret;
  27597 }
  27598 #else
        /* Big-endian form: both operands have their two lanes swapped before the
         * call, and the result is swapped back. */
  27599 __ai __attribute__((target("neon"))) uint64x2_t vshlq_u64(uint64x2_t __p0, int64x2_t __p1) {
  27600   uint64x2_t __ret;
  27601   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  27602   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  27603   __ret = (uint64x2_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  27604   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  27605   return __ret;
  27606 }
  27607 #endif
  27608 
  27609 #ifdef __LITTLE_ENDIAN__
        /* vshlq_u16: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 49, and returns the result as
         * uint16x8_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 49 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 16-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27610 __ai __attribute__((target("neon"))) uint16x8_t vshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  27611   uint16x8_t __ret;
  27612   __ret = (uint16x8_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  27613   return __ret;
  27614 }
  27615 #else
        /* Big-endian form: both operands have their eight lanes reversed before
         * the call, and the result is reversed back. */
  27616 __ai __attribute__((target("neon"))) uint16x8_t vshlq_u16(uint16x8_t __p0, int16x8_t __p1) {
  27617   uint16x8_t __ret;
  27618   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  27619   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  27620   __ret = (uint16x8_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  27621   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  27622   return __ret;
  27623 }
  27624 #endif
  27625 
  27626 #ifdef __LITTLE_ENDIAN__
        /* vshlq_s8: calls the generic __builtin_neon_vshlq_v on __p0 and __p1 (both
         * int8x16_t) with type code 32 and returns the result as int8x16_t. Per the
         * ACLE, each lane of __p0 is shifted left by the signed count in the
         * matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 32 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 8-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27627 __ai __attribute__((target("neon"))) int8x16_t vshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  27628   int8x16_t __ret;
  27629   __ret = (int8x16_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  27630   return __ret;
  27631 }
  27632 #else
        /* Big-endian form: both operands have their sixteen lanes reversed before
         * the call, and the result is reversed back. */
  27633 __ai __attribute__((target("neon"))) int8x16_t vshlq_s8(int8x16_t __p0, int8x16_t __p1) {
  27634   int8x16_t __ret;
  27635   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27636   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27637   __ret = (int8x16_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  27638   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  27639   return __ret;
  27640 }
  27641 #endif
  27642 
  27643 #ifdef __LITTLE_ENDIAN__
        /* vshlq_s32: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 34, and returns the result as
         * int32x4_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 34 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 32-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27644 __ai __attribute__((target("neon"))) int32x4_t vshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  27645   int32x4_t __ret;
  27646   __ret = (int32x4_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  27647   return __ret;
  27648 }
  27649 #else
        /* Big-endian form: both operands have their four lanes reversed before the
         * call, and the result is reversed back. */
  27650 __ai __attribute__((target("neon"))) int32x4_t vshlq_s32(int32x4_t __p0, int32x4_t __p1) {
  27651   int32x4_t __ret;
  27652   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  27653   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  27654   __ret = (int32x4_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  27655   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  27656   return __ret;
  27657 }
  27658 #endif
  27659 
  27660 #ifdef __LITTLE_ENDIAN__
        /* vshlq_s64: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 35, and returns the result as
         * int64x2_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 35 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 64-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27661 __ai __attribute__((target("neon"))) int64x2_t vshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  27662   int64x2_t __ret;
  27663   __ret = (int64x2_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  27664   return __ret;
  27665 }
  27666 #else
        /* Big-endian form: both operands have their two lanes swapped before the
         * call, and the result is swapped back. */
  27667 __ai __attribute__((target("neon"))) int64x2_t vshlq_s64(int64x2_t __p0, int64x2_t __p1) {
  27668   int64x2_t __ret;
  27669   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  27670   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  27671   __ret = (int64x2_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  27672   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  27673   return __ret;
  27674 }
  27675 #endif
  27676 
  27677 #ifdef __LITTLE_ENDIAN__
        /* vshlq_s16: casts __p0 and __p1 to int8x16_t, calls the generic
         * __builtin_neon_vshlq_v with type code 33, and returns the result as
         * int16x8_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 33 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 16-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27678 __ai __attribute__((target("neon"))) int16x8_t vshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  27679   int16x8_t __ret;
  27680   __ret = (int16x8_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  27681   return __ret;
  27682 }
  27683 #else
        /* Big-endian form: both operands have their eight lanes reversed before
         * the call, and the result is reversed back. */
  27684 __ai __attribute__((target("neon"))) int16x8_t vshlq_s16(int16x8_t __p0, int16x8_t __p1) {
  27685   int16x8_t __ret;
  27686   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  27687   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  27688   __ret = (int16x8_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  27689   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  27690   return __ret;
  27691 }
  27692 #endif
  27693 
  27694 #ifdef __LITTLE_ENDIAN__
        /* vshl_u8: casts __p0 and __p1 to int8x8_t, calls the generic
         * __builtin_neon_vshl_v with type code 16, and returns the result as
         * uint8x8_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 16 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of unsigned 8-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27695 __ai __attribute__((target("neon"))) uint8x8_t vshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  27696   uint8x8_t __ret;
  27697   __ret = (uint8x8_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  27698   return __ret;
  27699 }
  27700 #else
        /* Big-endian form: both operands have their eight lanes reversed before
         * the call, and the result is reversed back. */
  27701 __ai __attribute__((target("neon"))) uint8x8_t vshl_u8(uint8x8_t __p0, int8x8_t __p1) {
  27702   uint8x8_t __ret;
  27703   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  27704   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  27705   __ret = (uint8x8_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  27706   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  27707   return __ret;
  27708 }
  27709 #endif
  27710 
  27711 #ifdef __LITTLE_ENDIAN__
        /* vshl_u32: casts __p0 and __p1 to int8x8_t, calls the generic
         * __builtin_neon_vshl_v with type code 18, and returns the result as
         * uint32x2_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 18 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of unsigned 32-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27712 __ai __attribute__((target("neon"))) uint32x2_t vshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  27713   uint32x2_t __ret;
  27714   __ret = (uint32x2_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  27715   return __ret;
  27716 }
  27717 #else
        /* Big-endian form: both operands have their two lanes swapped before the
         * call, and the result is swapped back. */
  27718 __ai __attribute__((target("neon"))) uint32x2_t vshl_u32(uint32x2_t __p0, int32x2_t __p1) {
  27719   uint32x2_t __ret;
  27720   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  27721   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  27722   __ret = (uint32x2_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  27723   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  27724   return __ret;
  27725 }
  27726 #endif
  27727 
  27728 __ai __attribute__((target("neon"))) uint64x1_t vshl_u64(uint64x1_t __p0, int64x1_t __p1) {
          /* Casts __p0 and __p1 to int8x8_t, calls the generic __builtin_neon_vshl_v
           * with type code 19, and returns the result as uint64x1_t. Per the ACLE,
           * __p0 is shifted left by the signed count in __p1 (a negative count
           * shifts right). Defined once, outside any __LITTLE_ENDIAN__ conditional,
           * with no lane reversal.
           * NOTE(review): 19 looks like clang's NeonTypeFlags code for a 64-bit
           * vector of unsigned 64-bit lanes - confirm. */
  27729   uint64x1_t __ret;
  27730   __ret = (uint64x1_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  27731   return __ret;
  27732 }
  27733 #ifdef __LITTLE_ENDIAN__
        /* vshl_u16: casts __p0 and __p1 to int8x8_t, calls the generic
         * __builtin_neon_vshl_v with type code 17, and returns the result as
         * uint16x4_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 17 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of unsigned 16-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27734 __ai __attribute__((target("neon"))) uint16x4_t vshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  27735   uint16x4_t __ret;
  27736   __ret = (uint16x4_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  27737   return __ret;
  27738 }
  27739 #else
        /* Big-endian form: both operands have their four lanes reversed before the
         * call, and the result is reversed back. */
  27740 __ai __attribute__((target("neon"))) uint16x4_t vshl_u16(uint16x4_t __p0, int16x4_t __p1) {
  27741   uint16x4_t __ret;
  27742   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  27743   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  27744   __ret = (uint16x4_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  27745   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  27746   return __ret;
  27747 }
  27748 #endif
  27749 
  27750 #ifdef __LITTLE_ENDIAN__
        /* vshl_s8: calls the generic __builtin_neon_vshl_v on __p0 and __p1 (both
         * int8x8_t) with type code 0 and returns the result as int8x8_t. Per the
         * ACLE, each lane of __p0 is shifted left by the signed count in the
         * matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 0 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of signed 8-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27751 __ai __attribute__((target("neon"))) int8x8_t vshl_s8(int8x8_t __p0, int8x8_t __p1) {
  27752   int8x8_t __ret;
  27753   __ret = (int8x8_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  27754   return __ret;
  27755 }
  27756 #else
        /* Big-endian form: both operands have their eight lanes reversed before
         * the call, and the result is reversed back. */
  27757 __ai __attribute__((target("neon"))) int8x8_t vshl_s8(int8x8_t __p0, int8x8_t __p1) {
  27758   int8x8_t __ret;
  27759   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  27760   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  27761   __ret = (int8x8_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  27762   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  27763   return __ret;
  27764 }
  27765 #endif
  27766 
  27767 #ifdef __LITTLE_ENDIAN__
        /* vshl_s32: casts __p0 and __p1 to int8x8_t, calls the generic
         * __builtin_neon_vshl_v with type code 2, and returns the result as
         * int32x2_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 2 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of signed 32-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27768 __ai __attribute__((target("neon"))) int32x2_t vshl_s32(int32x2_t __p0, int32x2_t __p1) {
  27769   int32x2_t __ret;
  27770   __ret = (int32x2_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  27771   return __ret;
  27772 }
  27773 #else
        /* Big-endian form: both operands have their two lanes swapped before the
         * call, and the result is swapped back. */
  27774 __ai __attribute__((target("neon"))) int32x2_t vshl_s32(int32x2_t __p0, int32x2_t __p1) {
  27775   int32x2_t __ret;
  27776   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  27777   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  27778   __ret = (int32x2_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  27779   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  27780   return __ret;
  27781 }
  27782 #endif
  27783 
  27784 __ai __attribute__((target("neon"))) int64x1_t vshl_s64(int64x1_t __p0, int64x1_t __p1) {
          /* Casts __p0 and __p1 to int8x8_t, calls the generic __builtin_neon_vshl_v
           * with type code 3, and returns the result as int64x1_t. Per the ACLE,
           * __p0 is shifted left by the signed count in __p1 (a negative count
           * shifts right). Defined once, outside any __LITTLE_ENDIAN__ conditional,
           * with no lane reversal.
           * NOTE(review): 3 looks like clang's NeonTypeFlags code for a 64-bit
           * vector of signed 64-bit lanes - confirm. */
  27785   int64x1_t __ret;
  27786   __ret = (int64x1_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  27787   return __ret;
  27788 }
  27789 #ifdef __LITTLE_ENDIAN__
        /* vshl_s16: casts __p0 and __p1 to int8x8_t, calls the generic
         * __builtin_neon_vshl_v with type code 1, and returns the result as
         * int16x4_t. Per the ACLE, each lane of __p0 is shifted left by the signed
         * count in the matching lane of __p1 (a negative count shifts right).
         * NOTE(review): 1 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of signed 16-bit lanes - confirm.
         * Little-endian form: operands are passed to the builtin unchanged. */
  27790 __ai __attribute__((target("neon"))) int16x4_t vshl_s16(int16x4_t __p0, int16x4_t __p1) {
  27791   int16x4_t __ret;
  27792   __ret = (int16x4_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  27793   return __ret;
  27794 }
  27795 #else
        /* Big-endian form: both operands have their four lanes reversed before the
         * call, and the result is reversed back. */
  27796 __ai __attribute__((target("neon"))) int16x4_t vshl_s16(int16x4_t __p0, int16x4_t __p1) {
  27797   int16x4_t __ret;
  27798   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  27799   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  27800   __ret = (int16x4_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  27801   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  27802   return __ret;
  27803 }
  27804 #endif
  27805 
  27806 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_u8(__p0, __p1): copies the vector __p0 into a uint8x16_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 48; the result is yielded as uint8x16_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 48 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 8-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27807 #define vshlq_n_u8(__p0, __p1) __extension__ ({ \
  27808   uint8x16_t __ret; \
  27809   uint8x16_t __s0 = __p0; \
  27810   __ret = (uint8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 48); \
  27811   __ret; \
  27812 })
  27813 #else
        /* Big-endian form: the sixteen lanes of __p0 are reversed before the
         * builtin call and the result is reversed back. */
  27814 #define vshlq_n_u8(__p0, __p1) __extension__ ({ \
  27815   uint8x16_t __ret; \
  27816   uint8x16_t __s0 = __p0; \
  27817   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27818   __ret = (uint8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 48); \
  27819   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27820   __ret; \
  27821 })
  27822 #endif
  27823 
  27824 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_u32(__p0, __p1): copies the vector __p0 into a uint32x4_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 50; the result is yielded as uint32x4_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 50 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 32-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27825 #define vshlq_n_u32(__p0, __p1) __extension__ ({ \
  27826   uint32x4_t __ret; \
  27827   uint32x4_t __s0 = __p0; \
  27828   __ret = (uint32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 50); \
  27829   __ret; \
  27830 })
  27831 #else
        /* Big-endian form: the four lanes of __p0 are reversed before the builtin
         * call and the result is reversed back. */
  27832 #define vshlq_n_u32(__p0, __p1) __extension__ ({ \
  27833   uint32x4_t __ret; \
  27834   uint32x4_t __s0 = __p0; \
  27835   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  27836   __ret = (uint32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 50); \
  27837   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27838   __ret; \
  27839 })
  27840 #endif
  27841 
  27842 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_u64(__p0, __p1): copies the vector __p0 into a uint64x2_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 51; the result is yielded as uint64x2_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 51 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 64-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27843 #define vshlq_n_u64(__p0, __p1) __extension__ ({ \
  27844   uint64x2_t __ret; \
  27845   uint64x2_t __s0 = __p0; \
  27846   __ret = (uint64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 51); \
  27847   __ret; \
  27848 })
  27849 #else
        /* Big-endian form: the two lanes of __p0 are swapped before the builtin
         * call and the result is swapped back. */
  27850 #define vshlq_n_u64(__p0, __p1) __extension__ ({ \
  27851   uint64x2_t __ret; \
  27852   uint64x2_t __s0 = __p0; \
  27853   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  27854   __ret = (uint64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 51); \
  27855   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27856   __ret; \
  27857 })
  27858 #endif
  27859 
  27860 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_u16(__p0, __p1): copies the vector __p0 into a uint16x8_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 49; the result is yielded as uint16x8_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 49 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of unsigned 16-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27861 #define vshlq_n_u16(__p0, __p1) __extension__ ({ \
  27862   uint16x8_t __ret; \
  27863   uint16x8_t __s0 = __p0; \
  27864   __ret = (uint16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 49); \
  27865   __ret; \
  27866 })
  27867 #else
        /* Big-endian form: the eight lanes of __p0 are reversed before the builtin
         * call and the result is reversed back. */
  27868 #define vshlq_n_u16(__p0, __p1) __extension__ ({ \
  27869   uint16x8_t __ret; \
  27870   uint16x8_t __s0 = __p0; \
  27871   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  27872   __ret = (uint16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 49); \
  27873   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27874   __ret; \
  27875 })
  27876 #endif
  27877 
  27878 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_s8(__p0, __p1): copies the vector __p0 into an int8x16_t local
         * and calls __builtin_neon_vshlq_n_v with the shift amount __p1 and type
         * code 32; the result is yielded as int8x16_t. Per the ACLE, every lane is
         * shifted left by the immediate __p1.
         * NOTE(review): 32 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 8-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27879 #define vshlq_n_s8(__p0, __p1) __extension__ ({ \
  27880   int8x16_t __ret; \
  27881   int8x16_t __s0 = __p0; \
  27882   __ret = (int8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 32); \
  27883   __ret; \
  27884 })
  27885 #else
        /* Big-endian form: the sixteen lanes of __p0 are reversed before the
         * builtin call and the result is reversed back. */
  27886 #define vshlq_n_s8(__p0, __p1) __extension__ ({ \
  27887   int8x16_t __ret; \
  27888   int8x16_t __s0 = __p0; \
  27889   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27890   __ret = (int8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 32); \
  27891   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  27892   __ret; \
  27893 })
  27894 #endif
  27895 
  27896 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_s32(__p0, __p1): copies the vector __p0 into an int32x4_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 34; the result is yielded as int32x4_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 34 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 32-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27897 #define vshlq_n_s32(__p0, __p1) __extension__ ({ \
  27898   int32x4_t __ret; \
  27899   int32x4_t __s0 = __p0; \
  27900   __ret = (int32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 34); \
  27901   __ret; \
  27902 })
  27903 #else
        /* Big-endian form: the four lanes of __p0 are reversed before the builtin
         * call and the result is reversed back. */
  27904 #define vshlq_n_s32(__p0, __p1) __extension__ ({ \
  27905   int32x4_t __ret; \
  27906   int32x4_t __s0 = __p0; \
  27907   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  27908   __ret = (int32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 34); \
  27909   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  27910   __ret; \
  27911 })
  27912 #endif
  27913 
  27914 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_s64(__p0, __p1): copies the vector __p0 into an int64x2_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 35; the result is yielded as int64x2_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 35 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 64-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27915 #define vshlq_n_s64(__p0, __p1) __extension__ ({ \
  27916   int64x2_t __ret; \
  27917   int64x2_t __s0 = __p0; \
  27918   __ret = (int64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 35); \
  27919   __ret; \
  27920 })
  27921 #else
        /* Big-endian form: the two lanes of __p0 are swapped before the builtin
         * call and the result is swapped back. */
  27922 #define vshlq_n_s64(__p0, __p1) __extension__ ({ \
  27923   int64x2_t __ret; \
  27924   int64x2_t __s0 = __p0; \
  27925   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  27926   __ret = (int64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 35); \
  27927   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27928   __ret; \
  27929 })
  27930 #endif
  27931 
  27932 #ifdef __LITTLE_ENDIAN__
        /* vshlq_n_s16(__p0, __p1): copies the vector __p0 into an int16x8_t local,
         * casts it to int8x16_t, and calls __builtin_neon_vshlq_n_v with the shift
         * amount __p1 and type code 33; the result is yielded as int16x8_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 33 looks like clang's NeonTypeFlags code for a 128-bit
         * vector of signed 16-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27933 #define vshlq_n_s16(__p0, __p1) __extension__ ({ \
  27934   int16x8_t __ret; \
  27935   int16x8_t __s0 = __p0; \
  27936   __ret = (int16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 33); \
  27937   __ret; \
  27938 })
  27939 #else
        /* Big-endian form: the eight lanes of __p0 are reversed before the builtin
         * call and the result is reversed back. */
  27940 #define vshlq_n_s16(__p0, __p1) __extension__ ({ \
  27941   int16x8_t __ret; \
  27942   int16x8_t __s0 = __p0; \
  27943   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  27944   __ret = (int16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 33); \
  27945   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27946   __ret; \
  27947 })
  27948 #endif
  27949 
  27950 #ifdef __LITTLE_ENDIAN__
        /* vshl_n_u8(__p0, __p1): copies the vector __p0 into a uint8x8_t local,
         * casts it to int8x8_t, and calls __builtin_neon_vshl_n_v with the shift
         * amount __p1 and type code 16; the result is yielded as uint8x8_t. Per
         * the ACLE, every lane is shifted left by the immediate __p1.
         * NOTE(review): 16 looks like clang's NeonTypeFlags code for a 64-bit
         * vector of unsigned 8-bit lanes - confirm.
         * Little-endian form: the vector is passed to the builtin unchanged. */
  27951 #define vshl_n_u8(__p0, __p1) __extension__ ({ \
  27952   uint8x8_t __ret; \
  27953   uint8x8_t __s0 = __p0; \
  27954   __ret = (uint8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 16); \
  27955   __ret; \
  27956 })
  27957 #else
        /* Big-endian form: the eight lanes of __p0 are reversed before the builtin
         * call and the result is reversed back. */
  27958 #define vshl_n_u8(__p0, __p1) __extension__ ({ \
  27959   uint8x8_t __ret; \
  27960   uint8x8_t __s0 = __p0; \
  27961   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  27962   __ret = (uint8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 16); \
  27963   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  27964   __ret; \
  27965 })
  27966 #endif
  27967 
  /* vshl_n_u32(__p0, __p1): hands the uint32x2_t __p0 (cast to int8x8_t), __p1
   * and the constant 18 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the uint32x2_t result.
   * NOTE(review): presumably a per-lane left shift by the immediate __p1, with 18
   * acting as the builtin's element-type selector -- confirm. */
  27968 #ifdef __LITTLE_ENDIAN__
  27969 #define vshl_n_u32(__p0, __p1) __extension__ ({ \
  27970   uint32x2_t __ret; \
  27971   uint32x2_t __s0 = __p0; \
  27972   __ret = (uint32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 18); \
  27973   __ret; \
  27974 })
  27975 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  27976 #define vshl_n_u32(__p0, __p1) __extension__ ({ \
  27977   uint32x2_t __ret; \
  27978   uint32x2_t __s0 = __p0; \
  27979   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  27980   __ret = (uint32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 18); \
  27981   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  27982   __ret; \
  27983 })
  27984 #endif
  27985 
  /* vshl_n_u64(__p0, __p1): hands the uint64x1_t __p0 (cast to int8x8_t), __p1
   * and the constant 19 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the uint64x1_t result. This macro has a single definition with
   * no __LITTLE_ENDIAN__ split and no lane shuffling.
   * NOTE(review): presumably a left shift by the immediate __p1 on a one-lane
   * vector, with 19 as the builtin's element-type selector -- confirm. */
  27986 #define vshl_n_u64(__p0, __p1) __extension__ ({ \
  27987   uint64x1_t __ret; \
  27988   uint64x1_t __s0 = __p0; \
  27989   __ret = (uint64x1_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 19); \
  27990   __ret; \
  27991 })
  /* vshl_n_u16(__p0, __p1): hands the uint16x4_t __p0 (cast to int8x8_t), __p1
   * and the constant 17 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the uint16x4_t result.
   * NOTE(review): presumably a per-lane left shift by the immediate __p1, with 17
   * acting as the builtin's element-type selector -- confirm. */
  27992 #ifdef __LITTLE_ENDIAN__
  27993 #define vshl_n_u16(__p0, __p1) __extension__ ({ \
  27994   uint16x4_t __ret; \
  27995   uint16x4_t __s0 = __p0; \
  27996   __ret = (uint16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 17); \
  27997   __ret; \
  27998 })
  27999 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28000 #define vshl_n_u16(__p0, __p1) __extension__ ({ \
  28001   uint16x4_t __ret; \
  28002   uint16x4_t __s0 = __p0; \
  28003   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28004   __ret = (uint16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 17); \
  28005   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28006   __ret; \
  28007 })
  28008 #endif
  28009 
  /* vshl_n_s8(__p0, __p1): hands the int8x8_t __p0, __p1 and the constant 0 to
   * __builtin_neon_vshl_n_v; the statement expression evaluates to the int8x8_t
   * result.
   * NOTE(review): presumably a per-lane left shift by the immediate __p1, with 0
   * acting as the builtin's element-type selector -- confirm. */
  28010 #ifdef __LITTLE_ENDIAN__
  28011 #define vshl_n_s8(__p0, __p1) __extension__ ({ \
  28012   int8x8_t __ret; \
  28013   int8x8_t __s0 = __p0; \
  28014   __ret = (int8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 0); \
  28015   __ret; \
  28016 })
  28017 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28018 #define vshl_n_s8(__p0, __p1) __extension__ ({ \
  28019   int8x8_t __ret; \
  28020   int8x8_t __s0 = __p0; \
  28021   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28022   __ret = (int8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 0); \
  28023   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28024   __ret; \
  28025 })
  28026 #endif
  28027 
  /* vshl_n_s32(__p0, __p1): hands the int32x2_t __p0 (cast to int8x8_t), __p1 and
   * the constant 2 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the int32x2_t result.
   * NOTE(review): presumably a per-lane left shift by the immediate __p1, with 2
   * acting as the builtin's element-type selector -- confirm. */
  28028 #ifdef __LITTLE_ENDIAN__
  28029 #define vshl_n_s32(__p0, __p1) __extension__ ({ \
  28030   int32x2_t __ret; \
  28031   int32x2_t __s0 = __p0; \
  28032   __ret = (int32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 2); \
  28033   __ret; \
  28034 })
  28035 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28036 #define vshl_n_s32(__p0, __p1) __extension__ ({ \
  28037   int32x2_t __ret; \
  28038   int32x2_t __s0 = __p0; \
  28039   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28040   __ret = (int32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 2); \
  28041   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28042   __ret; \
  28043 })
  28044 #endif
  28045 
  /* vshl_n_s64(__p0, __p1): hands the int64x1_t __p0 (cast to int8x8_t), __p1 and
   * the constant 3 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the int64x1_t result. This macro has a single definition with
   * no __LITTLE_ENDIAN__ split and no lane shuffling.
   * NOTE(review): presumably a left shift by the immediate __p1 on a one-lane
   * vector, with 3 as the builtin's element-type selector -- confirm. */
  28046 #define vshl_n_s64(__p0, __p1) __extension__ ({ \
  28047   int64x1_t __ret; \
  28048   int64x1_t __s0 = __p0; \
  28049   __ret = (int64x1_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 3); \
  28050   __ret; \
  28051 })
  /* vshl_n_s16(__p0, __p1): hands the int16x4_t __p0 (cast to int8x8_t), __p1 and
   * the constant 1 to __builtin_neon_vshl_n_v; the statement expression
   * evaluates to the int16x4_t result.
   * NOTE(review): presumably a per-lane left shift by the immediate __p1, with 1
   * acting as the builtin's element-type selector -- confirm. */
  28052 #ifdef __LITTLE_ENDIAN__
  28053 #define vshl_n_s16(__p0, __p1) __extension__ ({ \
  28054   int16x4_t __ret; \
  28055   int16x4_t __s0 = __p0; \
  28056   __ret = (int16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 1); \
  28057   __ret; \
  28058 })
  28059 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28060 #define vshl_n_s16(__p0, __p1) __extension__ ({ \
  28061   int16x4_t __ret; \
  28062   int16x4_t __s0 = __p0; \
  28063   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28064   __ret = (int16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 1); \
  28065   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28066   __ret; \
  28067 })
  28068 #endif
  28069 
  /* vshll_n_u8(__p0, __p1): hands the uint8x8_t __p0 (cast to int8x8_t), __p1 and
   * the constant 49 to __builtin_neon_vshll_n_v; the statement expression
   * evaluates to a uint16x8_t result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 49
   * acting as the builtin's element-type selector -- confirm. */
  28070 #ifdef __LITTLE_ENDIAN__
  28071 #define vshll_n_u8(__p0, __p1) __extension__ ({ \
  28072   uint16x8_t __ret; \
  28073   uint8x8_t __s0 = __p0; \
  28074   __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 49); \
  28075   __ret; \
  28076 })
  28077 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28078 #define vshll_n_u8(__p0, __p1) __extension__ ({ \
  28079   uint16x8_t __ret; \
  28080   uint8x8_t __s0 = __p0; \
  28081   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28082   __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 49); \
  28083   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28084   __ret; \
  28085 })
  /* __noswap_vshll_n_u8: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28086 #define __noswap_vshll_n_u8(__p0, __p1) __extension__ ({ \
  28087   uint16x8_t __ret; \
  28088   uint8x8_t __s0 = __p0; \
  28089   __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 49); \
  28090   __ret; \
  28091 })
  28092 #endif
  28093 
  /* vshll_n_u32(__p0, __p1): hands the uint32x2_t __p0 (cast to int8x8_t), __p1
   * and the constant 51 to __builtin_neon_vshll_n_v; the statement expression
   * evaluates to a uint64x2_t result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 51
   * acting as the builtin's element-type selector -- confirm. */
  28094 #ifdef __LITTLE_ENDIAN__
  28095 #define vshll_n_u32(__p0, __p1) __extension__ ({ \
  28096   uint64x2_t __ret; \
  28097   uint32x2_t __s0 = __p0; \
  28098   __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 51); \
  28099   __ret; \
  28100 })
  28101 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28102 #define vshll_n_u32(__p0, __p1) __extension__ ({ \
  28103   uint64x2_t __ret; \
  28104   uint32x2_t __s0 = __p0; \
  28105   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28106   __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 51); \
  28107   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28108   __ret; \
  28109 })
  /* __noswap_vshll_n_u32: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28110 #define __noswap_vshll_n_u32(__p0, __p1) __extension__ ({ \
  28111   uint64x2_t __ret; \
  28112   uint32x2_t __s0 = __p0; \
  28113   __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 51); \
  28114   __ret; \
  28115 })
  28116 #endif
  28117 
  /* vshll_n_u16(__p0, __p1): hands the uint16x4_t __p0 (cast to int8x8_t), __p1
   * and the constant 50 to __builtin_neon_vshll_n_v; the statement expression
   * evaluates to a uint32x4_t result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 50
   * acting as the builtin's element-type selector -- confirm. */
  28118 #ifdef __LITTLE_ENDIAN__
  28119 #define vshll_n_u16(__p0, __p1) __extension__ ({ \
  28120   uint32x4_t __ret; \
  28121   uint16x4_t __s0 = __p0; \
  28122   __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 50); \
  28123   __ret; \
  28124 })
  28125 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28126 #define vshll_n_u16(__p0, __p1) __extension__ ({ \
  28127   uint32x4_t __ret; \
  28128   uint16x4_t __s0 = __p0; \
  28129   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28130   __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 50); \
  28131   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28132   __ret; \
  28133 })
  /* __noswap_vshll_n_u16: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28134 #define __noswap_vshll_n_u16(__p0, __p1) __extension__ ({ \
  28135   uint32x4_t __ret; \
  28136   uint16x4_t __s0 = __p0; \
  28137   __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 50); \
  28138   __ret; \
  28139 })
  28140 #endif
  28141 
  /* vshll_n_s8(__p0, __p1): hands the int8x8_t __p0, __p1 and the constant 33 to
   * __builtin_neon_vshll_n_v; the statement expression evaluates to an int16x8_t
   * result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 33
   * acting as the builtin's element-type selector -- confirm. */
  28142 #ifdef __LITTLE_ENDIAN__
  28143 #define vshll_n_s8(__p0, __p1) __extension__ ({ \
  28144   int16x8_t __ret; \
  28145   int8x8_t __s0 = __p0; \
  28146   __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 33); \
  28147   __ret; \
  28148 })
  28149 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28150 #define vshll_n_s8(__p0, __p1) __extension__ ({ \
  28151   int16x8_t __ret; \
  28152   int8x8_t __s0 = __p0; \
  28153   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28154   __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 33); \
  28155   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28156   __ret; \
  28157 })
  /* __noswap_vshll_n_s8: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28158 #define __noswap_vshll_n_s8(__p0, __p1) __extension__ ({ \
  28159   int16x8_t __ret; \
  28160   int8x8_t __s0 = __p0; \
  28161   __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 33); \
  28162   __ret; \
  28163 })
  28164 #endif
  28165 
  /* vshll_n_s32(__p0, __p1): hands the int32x2_t __p0 (cast to int8x8_t), __p1
   * and the constant 35 to __builtin_neon_vshll_n_v; the statement expression
   * evaluates to an int64x2_t result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 35
   * acting as the builtin's element-type selector -- confirm. */
  28166 #ifdef __LITTLE_ENDIAN__
  28167 #define vshll_n_s32(__p0, __p1) __extension__ ({ \
  28168   int64x2_t __ret; \
  28169   int32x2_t __s0 = __p0; \
  28170   __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 35); \
  28171   __ret; \
  28172 })
  28173 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28174 #define vshll_n_s32(__p0, __p1) __extension__ ({ \
  28175   int64x2_t __ret; \
  28176   int32x2_t __s0 = __p0; \
  28177   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28178   __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 35); \
  28179   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28180   __ret; \
  28181 })
  /* __noswap_vshll_n_s32: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28182 #define __noswap_vshll_n_s32(__p0, __p1) __extension__ ({ \
  28183   int64x2_t __ret; \
  28184   int32x2_t __s0 = __p0; \
  28185   __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 35); \
  28186   __ret; \
  28187 })
  28188 #endif
  28189 
  /* vshll_n_s16(__p0, __p1): hands the int16x4_t __p0 (cast to int8x8_t), __p1
   * and the constant 34 to __builtin_neon_vshll_n_v; the statement expression
   * evaluates to an int32x4_t result.
   * NOTE(review): presumably a widening left shift by the immediate __p1, with 34
   * acting as the builtin's element-type selector -- confirm. */
  28190 #ifdef __LITTLE_ENDIAN__
  28191 #define vshll_n_s16(__p0, __p1) __extension__ ({ \
  28192   int32x4_t __ret; \
  28193   int16x4_t __s0 = __p0; \
  28194   __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 34); \
  28195   __ret; \
  28196 })
  28197 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28198 #define vshll_n_s16(__p0, __p1) __extension__ ({ \
  28199   int32x4_t __ret; \
  28200   int16x4_t __s0 = __p0; \
  28201   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28202   __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 34); \
  28203   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28204   __ret; \
  28205 })
  /* __noswap_vshll_n_s16: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28206 #define __noswap_vshll_n_s16(__p0, __p1) __extension__ ({ \
  28207   int32x4_t __ret; \
  28208   int16x4_t __s0 = __p0; \
  28209   __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 34); \
  28210   __ret; \
  28211 })
  28212 #endif
  28213 
  /* vshrq_n_u8(__p0, __p1): hands the uint8x16_t __p0 (cast to int8x16_t), __p1
   * and the constant 48 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the uint8x16_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 48 acting as the builtin's element-type selector -- confirm. */
  28214 #ifdef __LITTLE_ENDIAN__
  28215 #define vshrq_n_u8(__p0, __p1) __extension__ ({ \
  28216   uint8x16_t __ret; \
  28217   uint8x16_t __s0 = __p0; \
  28218   __ret = (uint8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 48); \
  28219   __ret; \
  28220 })
  28221 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28222 #define vshrq_n_u8(__p0, __p1) __extension__ ({ \
  28223   uint8x16_t __ret; \
  28224   uint8x16_t __s0 = __p0; \
  28225   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28226   __ret = (uint8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 48); \
  28227   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28228   __ret; \
  28229 })
  28230 #endif
  28231 
  /* vshrq_n_u32(__p0, __p1): hands the uint32x4_t __p0 (cast to int8x16_t), __p1
   * and the constant 50 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the uint32x4_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 50 acting as the builtin's element-type selector -- confirm. */
  28232 #ifdef __LITTLE_ENDIAN__
  28233 #define vshrq_n_u32(__p0, __p1) __extension__ ({ \
  28234   uint32x4_t __ret; \
  28235   uint32x4_t __s0 = __p0; \
  28236   __ret = (uint32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 50); \
  28237   __ret; \
  28238 })
  28239 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28240 #define vshrq_n_u32(__p0, __p1) __extension__ ({ \
  28241   uint32x4_t __ret; \
  28242   uint32x4_t __s0 = __p0; \
  28243   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28244   __ret = (uint32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 50); \
  28245   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28246   __ret; \
  28247 })
  28248 #endif
  28249 
  /* vshrq_n_u64(__p0, __p1): hands the uint64x2_t __p0 (cast to int8x16_t), __p1
   * and the constant 51 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the uint64x2_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 51 acting as the builtin's element-type selector -- confirm. */
  28250 #ifdef __LITTLE_ENDIAN__
  28251 #define vshrq_n_u64(__p0, __p1) __extension__ ({ \
  28252   uint64x2_t __ret; \
  28253   uint64x2_t __s0 = __p0; \
  28254   __ret = (uint64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 51); \
  28255   __ret; \
  28256 })
  28257 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28258 #define vshrq_n_u64(__p0, __p1) __extension__ ({ \
  28259   uint64x2_t __ret; \
  28260   uint64x2_t __s0 = __p0; \
  28261   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28262   __ret = (uint64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 51); \
  28263   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28264   __ret; \
  28265 })
  28266 #endif
  28267 
  /* vshrq_n_u16(__p0, __p1): hands the uint16x8_t __p0 (cast to int8x16_t), __p1
   * and the constant 49 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the uint16x8_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 49 acting as the builtin's element-type selector -- confirm. */
  28268 #ifdef __LITTLE_ENDIAN__
  28269 #define vshrq_n_u16(__p0, __p1) __extension__ ({ \
  28270   uint16x8_t __ret; \
  28271   uint16x8_t __s0 = __p0; \
  28272   __ret = (uint16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 49); \
  28273   __ret; \
  28274 })
  28275 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28276 #define vshrq_n_u16(__p0, __p1) __extension__ ({ \
  28277   uint16x8_t __ret; \
  28278   uint16x8_t __s0 = __p0; \
  28279   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28280   __ret = (uint16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 49); \
  28281   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28282   __ret; \
  28283 })
  28284 #endif
  28285 
  /* vshrq_n_s8(__p0, __p1): hands the int8x16_t __p0, __p1 and the constant 32 to
   * __builtin_neon_vshrq_n_v; the statement expression evaluates to the
   * int8x16_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 32 acting as the builtin's element-type selector -- confirm. */
  28286 #ifdef __LITTLE_ENDIAN__
  28287 #define vshrq_n_s8(__p0, __p1) __extension__ ({ \
  28288   int8x16_t __ret; \
  28289   int8x16_t __s0 = __p0; \
  28290   __ret = (int8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 32); \
  28291   __ret; \
  28292 })
  28293 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28294 #define vshrq_n_s8(__p0, __p1) __extension__ ({ \
  28295   int8x16_t __ret; \
  28296   int8x16_t __s0 = __p0; \
  28297   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28298   __ret = (int8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 32); \
  28299   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28300   __ret; \
  28301 })
  28302 #endif
  28303 
  /* vshrq_n_s32(__p0, __p1): hands the int32x4_t __p0 (cast to int8x16_t), __p1
   * and the constant 34 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the int32x4_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 34 acting as the builtin's element-type selector -- confirm. */
  28304 #ifdef __LITTLE_ENDIAN__
  28305 #define vshrq_n_s32(__p0, __p1) __extension__ ({ \
  28306   int32x4_t __ret; \
  28307   int32x4_t __s0 = __p0; \
  28308   __ret = (int32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 34); \
  28309   __ret; \
  28310 })
  28311 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28312 #define vshrq_n_s32(__p0, __p1) __extension__ ({ \
  28313   int32x4_t __ret; \
  28314   int32x4_t __s0 = __p0; \
  28315   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28316   __ret = (int32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 34); \
  28317   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28318   __ret; \
  28319 })
  28320 #endif
  28321 
  /* vshrq_n_s64(__p0, __p1): hands the int64x2_t __p0 (cast to int8x16_t), __p1
   * and the constant 35 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the int64x2_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 35 acting as the builtin's element-type selector -- confirm. */
  28322 #ifdef __LITTLE_ENDIAN__
  28323 #define vshrq_n_s64(__p0, __p1) __extension__ ({ \
  28324   int64x2_t __ret; \
  28325   int64x2_t __s0 = __p0; \
  28326   __ret = (int64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 35); \
  28327   __ret; \
  28328 })
  28329 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28330 #define vshrq_n_s64(__p0, __p1) __extension__ ({ \
  28331   int64x2_t __ret; \
  28332   int64x2_t __s0 = __p0; \
  28333   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28334   __ret = (int64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 35); \
  28335   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28336   __ret; \
  28337 })
  28338 #endif
  28339 
  /* vshrq_n_s16(__p0, __p1): hands the int16x8_t __p0 (cast to int8x16_t), __p1
   * and the constant 33 to __builtin_neon_vshrq_n_v; the statement expression
   * evaluates to the int16x8_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 33 acting as the builtin's element-type selector -- confirm. */
  28340 #ifdef __LITTLE_ENDIAN__
  28341 #define vshrq_n_s16(__p0, __p1) __extension__ ({ \
  28342   int16x8_t __ret; \
  28343   int16x8_t __s0 = __p0; \
  28344   __ret = (int16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 33); \
  28345   __ret; \
  28346 })
  28347 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28348 #define vshrq_n_s16(__p0, __p1) __extension__ ({ \
  28349   int16x8_t __ret; \
  28350   int16x8_t __s0 = __p0; \
  28351   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28352   __ret = (int16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 33); \
  28353   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28354   __ret; \
  28355 })
  28356 #endif
  28357 
  /* vshr_n_u8(__p0, __p1): hands the uint8x8_t __p0 (cast to int8x8_t), __p1 and
   * the constant 16 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the uint8x8_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 16 acting as the builtin's element-type selector -- confirm. */
  28358 #ifdef __LITTLE_ENDIAN__
  28359 #define vshr_n_u8(__p0, __p1) __extension__ ({ \
  28360   uint8x8_t __ret; \
  28361   uint8x8_t __s0 = __p0; \
  28362   __ret = (uint8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 16); \
  28363   __ret; \
  28364 })
  28365 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28366 #define vshr_n_u8(__p0, __p1) __extension__ ({ \
  28367   uint8x8_t __ret; \
  28368   uint8x8_t __s0 = __p0; \
  28369   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28370   __ret = (uint8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 16); \
  28371   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28372   __ret; \
  28373 })
  28374 #endif
  28375 
  /* vshr_n_u32(__p0, __p1): hands the uint32x2_t __p0 (cast to int8x8_t), __p1
   * and the constant 18 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the uint32x2_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 18 acting as the builtin's element-type selector -- confirm. */
  28376 #ifdef __LITTLE_ENDIAN__
  28377 #define vshr_n_u32(__p0, __p1) __extension__ ({ \
  28378   uint32x2_t __ret; \
  28379   uint32x2_t __s0 = __p0; \
  28380   __ret = (uint32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 18); \
  28381   __ret; \
  28382 })
  28383 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28384 #define vshr_n_u32(__p0, __p1) __extension__ ({ \
  28385   uint32x2_t __ret; \
  28386   uint32x2_t __s0 = __p0; \
  28387   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28388   __ret = (uint32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 18); \
  28389   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28390   __ret; \
  28391 })
  28392 #endif
  28393 
  /* vshr_n_u64(__p0, __p1): hands the uint64x1_t __p0 (cast to int8x8_t), __p1
   * and the constant 19 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the uint64x1_t result. This macro has a single definition with
   * no __LITTLE_ENDIAN__ split and no lane shuffling.
   * NOTE(review): presumably a right shift by the immediate __p1 on a one-lane
   * vector, with 19 as the builtin's element-type selector -- confirm. */
  28394 #define vshr_n_u64(__p0, __p1) __extension__ ({ \
  28395   uint64x1_t __ret; \
  28396   uint64x1_t __s0 = __p0; \
  28397   __ret = (uint64x1_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 19); \
  28398   __ret; \
  28399 })
  /* vshr_n_u16(__p0, __p1): hands the uint16x4_t __p0 (cast to int8x8_t), __p1
   * and the constant 17 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the uint16x4_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with
   * 17 acting as the builtin's element-type selector -- confirm. */
  28400 #ifdef __LITTLE_ENDIAN__
  28401 #define vshr_n_u16(__p0, __p1) __extension__ ({ \
  28402   uint16x4_t __ret; \
  28403   uint16x4_t __s0 = __p0; \
  28404   __ret = (uint16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 17); \
  28405   __ret; \
  28406 })
  28407 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28408 #define vshr_n_u16(__p0, __p1) __extension__ ({ \
  28409   uint16x4_t __ret; \
  28410   uint16x4_t __s0 = __p0; \
  28411   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28412   __ret = (uint16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 17); \
  28413   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28414   __ret; \
  28415 })
  28416 #endif
  28417 
  /* vshr_n_s8(__p0, __p1): hands the int8x8_t __p0, __p1 and the constant 0 to
   * __builtin_neon_vshr_n_v; the statement expression evaluates to the int8x8_t
   * result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with 0
   * acting as the builtin's element-type selector -- confirm. */
  28418 #ifdef __LITTLE_ENDIAN__
  28419 #define vshr_n_s8(__p0, __p1) __extension__ ({ \
  28420   int8x8_t __ret; \
  28421   int8x8_t __s0 = __p0; \
  28422   __ret = (int8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 0); \
  28423   __ret; \
  28424 })
  28425 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28426 #define vshr_n_s8(__p0, __p1) __extension__ ({ \
  28427   int8x8_t __ret; \
  28428   int8x8_t __s0 = __p0; \
  28429   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28430   __ret = (int8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 0); \
  28431   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28432   __ret; \
  28433 })
  28434 #endif
  28435 
  /* vshr_n_s32(__p0, __p1): hands the int32x2_t __p0 (cast to int8x8_t), __p1 and
   * the constant 2 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the int32x2_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with 2
   * acting as the builtin's element-type selector -- confirm. */
  28436 #ifdef __LITTLE_ENDIAN__
  28437 #define vshr_n_s32(__p0, __p1) __extension__ ({ \
  28438   int32x2_t __ret; \
  28439   int32x2_t __s0 = __p0; \
  28440   __ret = (int32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 2); \
  28441   __ret; \
  28442 })
  28443 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28444 #define vshr_n_s32(__p0, __p1) __extension__ ({ \
  28445   int32x2_t __ret; \
  28446   int32x2_t __s0 = __p0; \
  28447   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28448   __ret = (int32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 2); \
  28449   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28450   __ret; \
  28451 })
  28452 #endif
  28453 
  /* vshr_n_s64(__p0, __p1): hands the int64x1_t __p0 (cast to int8x8_t), __p1 and
   * the constant 3 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the int64x1_t result. This macro has a single definition with
   * no __LITTLE_ENDIAN__ split and no lane shuffling.
   * NOTE(review): presumably a right shift by the immediate __p1 on a one-lane
   * vector, with 3 as the builtin's element-type selector -- confirm. */
  28454 #define vshr_n_s64(__p0, __p1) __extension__ ({ \
  28455   int64x1_t __ret; \
  28456   int64x1_t __s0 = __p0; \
  28457   __ret = (int64x1_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 3); \
  28458   __ret; \
  28459 })
  /* vshr_n_s16(__p0, __p1): hands the int16x4_t __p0 (cast to int8x8_t), __p1 and
   * the constant 1 to __builtin_neon_vshr_n_v; the statement expression
   * evaluates to the int16x4_t result.
   * NOTE(review): presumably a per-lane right shift by the immediate __p1, with 1
   * acting as the builtin's element-type selector -- confirm. */
  28460 #ifdef __LITTLE_ENDIAN__
  28461 #define vshr_n_s16(__p0, __p1) __extension__ ({ \
  28462   int16x4_t __ret; \
  28463   int16x4_t __s0 = __p0; \
  28464   __ret = (int16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 1); \
  28465   __ret; \
  28466 })
  28467 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28468 #define vshr_n_s16(__p0, __p1) __extension__ ({ \
  28469   int16x4_t __ret; \
  28470   int16x4_t __s0 = __p0; \
  28471   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28472   __ret = (int16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 1); \
  28473   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28474   __ret; \
  28475 })
  28476 #endif
  28477 
  /* vshrn_n_u32(__p0, __p1): hands the uint32x4_t __p0 (cast to int8x16_t), __p1
   * and the constant 17 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to a uint16x4_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 17 acting as the builtin's element-type selector -- confirm. */
  28478 #ifdef __LITTLE_ENDIAN__
  28479 #define vshrn_n_u32(__p0, __p1) __extension__ ({ \
  28480   uint16x4_t __ret; \
  28481   uint32x4_t __s0 = __p0; \
  28482   __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 17); \
  28483   __ret; \
  28484 })
  28485 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28486 #define vshrn_n_u32(__p0, __p1) __extension__ ({ \
  28487   uint16x4_t __ret; \
  28488   uint32x4_t __s0 = __p0; \
  28489   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28490   __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 17); \
  28491   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28492   __ret; \
  28493 })
  /* __noswap_vshrn_n_u32: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28494 #define __noswap_vshrn_n_u32(__p0, __p1) __extension__ ({ \
  28495   uint16x4_t __ret; \
  28496   uint32x4_t __s0 = __p0; \
  28497   __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 17); \
  28498   __ret; \
  28499 })
  28500 #endif
  28501 
  /* vshrn_n_u64(__p0, __p1): hands the uint64x2_t __p0 (cast to int8x16_t), __p1
   * and the constant 18 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to a uint32x2_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 18 acting as the builtin's element-type selector -- confirm. */
  28502 #ifdef __LITTLE_ENDIAN__
  28503 #define vshrn_n_u64(__p0, __p1) __extension__ ({ \
  28504   uint32x2_t __ret; \
  28505   uint64x2_t __s0 = __p0; \
  28506   __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 18); \
  28507   __ret; \
  28508 })
  28509 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28510 #define vshrn_n_u64(__p0, __p1) __extension__ ({ \
  28511   uint32x2_t __ret; \
  28512   uint64x2_t __s0 = __p0; \
  28513   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28514   __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 18); \
  28515   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28516   __ret; \
  28517 })
  /* __noswap_vshrn_n_u64: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28518 #define __noswap_vshrn_n_u64(__p0, __p1) __extension__ ({ \
  28519   uint32x2_t __ret; \
  28520   uint64x2_t __s0 = __p0; \
  28521   __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 18); \
  28522   __ret; \
  28523 })
  28524 #endif
  28525 
  /* vshrn_n_u16(__p0, __p1): hands the uint16x8_t __p0 (cast to int8x16_t), __p1
   * and the constant 16 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to a uint8x8_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 16 acting as the builtin's element-type selector -- confirm. */
  28526 #ifdef __LITTLE_ENDIAN__
  28527 #define vshrn_n_u16(__p0, __p1) __extension__ ({ \
  28528   uint8x8_t __ret; \
  28529   uint16x8_t __s0 = __p0; \
  28530   __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 16); \
  28531   __ret; \
  28532 })
  28533 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28534 #define vshrn_n_u16(__p0, __p1) __extension__ ({ \
  28535   uint8x8_t __ret; \
  28536   uint16x8_t __s0 = __p0; \
  28537   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28538   __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 16); \
  28539   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28540   __ret; \
  28541 })
  /* __noswap_vshrn_n_u16: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28542 #define __noswap_vshrn_n_u16(__p0, __p1) __extension__ ({ \
  28543   uint8x8_t __ret; \
  28544   uint16x8_t __s0 = __p0; \
  28545   __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 16); \
  28546   __ret; \
  28547 })
  28548 #endif
  28549 
  /* vshrn_n_s32(__p0, __p1): hands the int32x4_t __p0 (cast to int8x16_t), __p1
   * and the constant 1 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to an int16x4_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 1 acting as the builtin's element-type selector -- confirm. */
  28550 #ifdef __LITTLE_ENDIAN__
  28551 #define vshrn_n_s32(__p0, __p1) __extension__ ({ \
  28552   int16x4_t __ret; \
  28553   int32x4_t __s0 = __p0; \
  28554   __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 1); \
  28555   __ret; \
  28556 })
  28557 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28558 #define vshrn_n_s32(__p0, __p1) __extension__ ({ \
  28559   int16x4_t __ret; \
  28560   int32x4_t __s0 = __p0; \
  28561   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28562   __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 1); \
  28563   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28564   __ret; \
  28565 })
  /* __noswap_vshrn_n_s32: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28566 #define __noswap_vshrn_n_s32(__p0, __p1) __extension__ ({ \
  28567   int16x4_t __ret; \
  28568   int32x4_t __s0 = __p0; \
  28569   __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 1); \
  28570   __ret; \
  28571 })
  28572 #endif
  28573 
  /* vshrn_n_s64(__p0, __p1): hands the int64x2_t __p0 (cast to int8x16_t), __p1
   * and the constant 2 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to an int32x2_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 2 acting as the builtin's element-type selector -- confirm. */
  28574 #ifdef __LITTLE_ENDIAN__
  28575 #define vshrn_n_s64(__p0, __p1) __extension__ ({ \
  28576   int32x2_t __ret; \
  28577   int64x2_t __s0 = __p0; \
  28578   __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 2); \
  28579   __ret; \
  28580 })
  28581 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28582 #define vshrn_n_s64(__p0, __p1) __extension__ ({ \
  28583   int32x2_t __ret; \
  28584   int64x2_t __s0 = __p0; \
  28585   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28586   __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 2); \
  28587   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28588   __ret; \
  28589 })
  /* __noswap_vshrn_n_s64: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28590 #define __noswap_vshrn_n_s64(__p0, __p1) __extension__ ({ \
  28591   int32x2_t __ret; \
  28592   int64x2_t __s0 = __p0; \
  28593   __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 2); \
  28594   __ret; \
  28595 })
  28596 #endif
  28597 
  /* vshrn_n_s16(__p0, __p1): hands the int16x8_t __p0 (cast to int8x16_t), __p1
   * and the constant 0 to __builtin_neon_vshrn_n_v; the statement expression
   * evaluates to an int8x8_t result.
   * NOTE(review): presumably a narrowing right shift by the immediate __p1, with
   * 0 acting as the builtin's element-type selector -- confirm. */
  28598 #ifdef __LITTLE_ENDIAN__
  28599 #define vshrn_n_s16(__p0, __p1) __extension__ ({ \
  28600   int8x8_t __ret; \
  28601   int16x8_t __s0 = __p0; \
  28602   __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 0); \
  28603   __ret; \
  28604 })
  28605 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of the
   * input, call the builtin, then reverse the lanes of the result. */
  28606 #define vshrn_n_s16(__p0, __p1) __extension__ ({ \
  28607   int8x8_t __ret; \
  28608   int16x8_t __s0 = __p0; \
  28609   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28610   __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 0); \
  28611   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28612   __ret; \
  28613 })
  /* __noswap_vshrn_n_s16: only defined in this branch; same body as the
   * __LITTLE_ENDIAN__ definition, i.e. no lane reversal.
   * NOTE(review): presumably for callers whose operands are already
   * lane-reversed -- confirm against its users. */
  28614 #define __noswap_vshrn_n_s16(__p0, __p1) __extension__ ({ \
  28615   int8x8_t __ret; \
  28616   int16x8_t __s0 = __p0; \
  28617   __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 0); \
  28618   __ret; \
  28619 })
  28620 #endif
  28621 
  /* vsli_n_p8(__p0, __p1, __p2): hands the poly8x8_t vectors __p0 and __p1 (both
   * cast to int8x8_t), __p2 and the constant 4 to __builtin_neon_vsli_n_v; the
   * statement expression evaluates to the poly8x8_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 4 as the builtin's element-type selector -- confirm. */
  28622 #ifdef __LITTLE_ENDIAN__
  28623 #define vsli_n_p8(__p0, __p1, __p2) __extension__ ({ \
  28624   poly8x8_t __ret; \
  28625   poly8x8_t __s0 = __p0; \
  28626   poly8x8_t __s1 = __p1; \
  28627   __ret = (poly8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \
  28628   __ret; \
  28629 })
  28630 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28631 #define vsli_n_p8(__p0, __p1, __p2) __extension__ ({ \
  28632   poly8x8_t __ret; \
  28633   poly8x8_t __s0 = __p0; \
  28634   poly8x8_t __s1 = __p1; \
  28635   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28636   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28637   __ret = (poly8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \
  28638   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28639   __ret; \
  28640 })
  28641 #endif
  28642 
  /* vsli_n_p16(__p0, __p1, __p2): hands the poly16x4_t vectors __p0 and __p1
   * (both cast to int8x8_t), __p2 and the constant 5 to __builtin_neon_vsli_n_v;
   * the statement expression evaluates to the poly16x4_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 5 as the builtin's element-type selector -- confirm. */
  28643 #ifdef __LITTLE_ENDIAN__
  28644 #define vsli_n_p16(__p0, __p1, __p2) __extension__ ({ \
  28645   poly16x4_t __ret; \
  28646   poly16x4_t __s0 = __p0; \
  28647   poly16x4_t __s1 = __p1; \
  28648   __ret = (poly16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \
  28649   __ret; \
  28650 })
  28651 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28652 #define vsli_n_p16(__p0, __p1, __p2) __extension__ ({ \
  28653   poly16x4_t __ret; \
  28654   poly16x4_t __s0 = __p0; \
  28655   poly16x4_t __s1 = __p1; \
  28656   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28657   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  28658   __ret = (poly16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 5); \
  28659   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28660   __ret; \
  28661 })
  28662 #endif
  28663 
  /* vsliq_n_p8(__p0, __p1, __p2): hands the poly8x16_t vectors __p0 and __p1
   * (both cast to int8x16_t), __p2 and the constant 36 to
   * __builtin_neon_vsliq_n_v; the statement expression evaluates to the
   * poly8x16_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 36 as the builtin's element-type selector -- confirm. */
  28664 #ifdef __LITTLE_ENDIAN__
  28665 #define vsliq_n_p8(__p0, __p1, __p2) __extension__ ({ \
  28666   poly8x16_t __ret; \
  28667   poly8x16_t __s0 = __p0; \
  28668   poly8x16_t __s1 = __p1; \
  28669   __ret = (poly8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \
  28670   __ret; \
  28671 })
  28672 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28673 #define vsliq_n_p8(__p0, __p1, __p2) __extension__ ({ \
  28674   poly8x16_t __ret; \
  28675   poly8x16_t __s0 = __p0; \
  28676   poly8x16_t __s1 = __p1; \
  28677   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28678   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28679   __ret = (poly8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
  28680   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28681   __ret; \
  28682 })
  28683 #endif
  28684 
  /* vsliq_n_p16(__p0, __p1, __p2): hands the poly16x8_t vectors __p0 and __p1
   * (both cast to int8x16_t), __p2 and the constant 37 to
   * __builtin_neon_vsliq_n_v; the statement expression evaluates to the
   * poly16x8_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 37 as the builtin's element-type selector -- confirm. */
  28685 #ifdef __LITTLE_ENDIAN__
  28686 #define vsliq_n_p16(__p0, __p1, __p2) __extension__ ({ \
  28687   poly16x8_t __ret; \
  28688   poly16x8_t __s0 = __p0; \
  28689   poly16x8_t __s1 = __p1; \
  28690   __ret = (poly16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \
  28691   __ret; \
  28692 })
  28693 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28694 #define vsliq_n_p16(__p0, __p1, __p2) __extension__ ({ \
  28695   poly16x8_t __ret; \
  28696   poly16x8_t __s0 = __p0; \
  28697   poly16x8_t __s1 = __p1; \
  28698   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28699   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28700   __ret = (poly16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \
  28701   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28702   __ret; \
  28703 })
  28704 #endif
  28705 
  /* vsliq_n_u8(__p0, __p1, __p2): hands the uint8x16_t vectors __p0 and __p1
   * (both cast to int8x16_t), __p2 and the constant 48 to
   * __builtin_neon_vsliq_n_v; the statement expression evaluates to the
   * uint8x16_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 48 as the builtin's element-type selector -- confirm. */
  28706 #ifdef __LITTLE_ENDIAN__
  28707 #define vsliq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  28708   uint8x16_t __ret; \
  28709   uint8x16_t __s0 = __p0; \
  28710   uint8x16_t __s1 = __p1; \
  28711   __ret = (uint8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  28712   __ret; \
  28713 })
  28714 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28715 #define vsliq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  28716   uint8x16_t __ret; \
  28717   uint8x16_t __s0 = __p0; \
  28718   uint8x16_t __s1 = __p1; \
  28719   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28720   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28721   __ret = (uint8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  28722   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28723   __ret; \
  28724 })
  28725 #endif
  28726 
  /* vsliq_n_u32(__p0, __p1, __p2): hands the uint32x4_t vectors __p0 and __p1
   * (both cast to int8x16_t), __p2 and the constant 50 to
   * __builtin_neon_vsliq_n_v; the statement expression evaluates to the
   * uint32x4_t result.
   * NOTE(review): presumably a shift-left-and-insert of __p1 into __p0 by the
   * immediate __p2, with 50 as the builtin's element-type selector -- confirm. */
  28727 #ifdef __LITTLE_ENDIAN__
  28728 #define vsliq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  28729   uint32x4_t __ret; \
  28730   uint32x4_t __s0 = __p0; \
  28731   uint32x4_t __s1 = __p1; \
  28732   __ret = (uint32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \
  28733   __ret; \
  28734 })
  28735 #else
  /* Variant for when __LITTLE_ENDIAN__ is not defined: reverse the lanes of both
   * inputs, call the builtin, then reverse the lanes of the result. */
  28736 #define vsliq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  28737   uint32x4_t __ret; \
  28738   uint32x4_t __s0 = __p0; \
  28739   uint32x4_t __s1 = __p1; \
  28740   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28741   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  28742   __ret = (uint32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \
  28743   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28744   __ret; \
  28745 })
  28746 #endif
  28747 
  /* vsliq_n_u64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint64x2_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsliq_n_v with trailing constant 51, and yields the
   * result cast back to uint64x2_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 51 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  28748 #ifdef __LITTLE_ENDIAN__
  28749 #define vsliq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  28750   uint64x2_t __ret; \
  28751   uint64x2_t __s0 = __p0; \
  28752   uint64x2_t __s1 = __p1; \
  28753   __ret = (uint64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
  28754   __ret; \
  28755 })
  28756 #else
  28757 #define vsliq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  28758   uint64x2_t __ret; \
  28759   uint64x2_t __s0 = __p0; \
  28760   uint64x2_t __s1 = __p1; \
  28761   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28762   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  28763   __ret = (uint64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
  28764   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28765   __ret; \
  28766 })
  28767 #endif
  28768 
  /* vsliq_n_u16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint16x8_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsliq_n_v with trailing constant 49, and yields the
   * result cast back to uint16x8_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 49 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28769 #ifdef __LITTLE_ENDIAN__
  28770 #define vsliq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  28771   uint16x8_t __ret; \
  28772   uint16x8_t __s0 = __p0; \
  28773   uint16x8_t __s1 = __p1; \
  28774   __ret = (uint16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \
  28775   __ret; \
  28776 })
  28777 #else
  28778 #define vsliq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  28779   uint16x8_t __ret; \
  28780   uint16x8_t __s0 = __p0; \
  28781   uint16x8_t __s1 = __p1; \
  28782   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28783   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28784   __ret = (uint16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
  28785   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28786   __ret; \
  28787 })
  28788 #endif
  28789 
  /* vsliq_n_s8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int8x16_t locals, passes them (cast to int8x16_t) plus __p2 to
   * __builtin_neon_vsliq_n_v with trailing constant 32, and yields the result
   * cast to int8x16_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 32 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 16 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28790 #ifdef __LITTLE_ENDIAN__
  28791 #define vsliq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  28792   int8x16_t __ret; \
  28793   int8x16_t __s0 = __p0; \
  28794   int8x16_t __s1 = __p1; \
  28795   __ret = (int8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  28796   __ret; \
  28797 })
  28798 #else
  28799 #define vsliq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  28800   int8x16_t __ret; \
  28801   int8x16_t __s0 = __p0; \
  28802   int8x16_t __s1 = __p1; \
  28803   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28804   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28805   __ret = (int8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  28806   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  28807   __ret; \
  28808 })
  28809 #endif
  28810 
  /* vsliq_n_s32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int32x4_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsliq_n_v with trailing constant 34, and yields the
   * result cast back to int32x4_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 34 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28811 #ifdef __LITTLE_ENDIAN__
  28812 #define vsliq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  28813   int32x4_t __ret; \
  28814   int32x4_t __s0 = __p0; \
  28815   int32x4_t __s1 = __p1; \
  28816   __ret = (int32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  28817   __ret; \
  28818 })
  28819 #else
  28820 #define vsliq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  28821   int32x4_t __ret; \
  28822   int32x4_t __s0 = __p0; \
  28823   int32x4_t __s1 = __p1; \
  28824   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28825   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  28826   __ret = (int32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
  28827   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28828   __ret; \
  28829 })
  28830 #endif
  28831 
  /* vsliq_n_s64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int64x2_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsliq_n_v with trailing constant 35, and yields the
   * result cast back to int64x2_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 35 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  28832 #ifdef __LITTLE_ENDIAN__
  28833 #define vsliq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  28834   int64x2_t __ret; \
  28835   int64x2_t __s0 = __p0; \
  28836   int64x2_t __s1 = __p1; \
  28837   __ret = (int64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \
  28838   __ret; \
  28839 })
  28840 #else
  28841 #define vsliq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  28842   int64x2_t __ret; \
  28843   int64x2_t __s0 = __p0; \
  28844   int64x2_t __s1 = __p1; \
  28845   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28846   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  28847   __ret = (int64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \
  28848   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28849   __ret; \
  28850 })
  28851 #endif
  28852 
  /* vsliq_n_s16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int16x8_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsliq_n_v with trailing constant 33, and yields the
   * result cast back to int16x8_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 33 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28853 #ifdef __LITTLE_ENDIAN__
  28854 #define vsliq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  28855   int16x8_t __ret; \
  28856   int16x8_t __s0 = __p0; \
  28857   int16x8_t __s1 = __p1; \
  28858   __ret = (int16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  28859   __ret; \
  28860 })
  28861 #else
  28862 #define vsliq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  28863   int16x8_t __ret; \
  28864   int16x8_t __s0 = __p0; \
  28865   int16x8_t __s1 = __p1; \
  28866   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28867   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28868   __ret = (int16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  28869   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28870   __ret; \
  28871 })
  28872 #endif
  28873 
  /* vsli_n_u8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint8x8_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 16, and yields the result
   * cast back to uint8x8_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 16 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28874 #ifdef __LITTLE_ENDIAN__
  28875 #define vsli_n_u8(__p0, __p1, __p2) __extension__ ({ \
  28876   uint8x8_t __ret; \
  28877   uint8x8_t __s0 = __p0; \
  28878   uint8x8_t __s1 = __p1; \
  28879   __ret = (uint8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \
  28880   __ret; \
  28881 })
  28882 #else
  28883 #define vsli_n_u8(__p0, __p1, __p2) __extension__ ({ \
  28884   uint8x8_t __ret; \
  28885   uint8x8_t __s0 = __p0; \
  28886   uint8x8_t __s1 = __p1; \
  28887   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28888   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28889   __ret = (uint8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \
  28890   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28891   __ret; \
  28892 })
  28893 #endif
  28894 
  /* vsli_n_u32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint32x2_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 18, and yields the result
   * cast back to uint32x2_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 18 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  28895 #ifdef __LITTLE_ENDIAN__
  28896 #define vsli_n_u32(__p0, __p1, __p2) __extension__ ({ \
  28897   uint32x2_t __ret; \
  28898   uint32x2_t __s0 = __p0; \
  28899   uint32x2_t __s1 = __p1; \
  28900   __ret = (uint32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \
  28901   __ret; \
  28902 })
  28903 #else
  28904 #define vsli_n_u32(__p0, __p1, __p2) __extension__ ({ \
  28905   uint32x2_t __ret; \
  28906   uint32x2_t __s0 = __p0; \
  28907   uint32x2_t __s1 = __p1; \
  28908   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28909   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  28910   __ret = (uint32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \
  28911   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28912   __ret; \
  28913 })
  28914 #endif
  28915 
  /* vsli_n_u64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint64x1_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 19, and yields the result
   * cast back to uint64x1_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 19 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * This definition is not conditional on __LITTLE_ENDIAN__ and performs no
   * lane reversal. */
  28916 #define vsli_n_u64(__p0, __p1, __p2) __extension__ ({ \
  28917   uint64x1_t __ret; \
  28918   uint64x1_t __s0 = __p0; \
  28919   uint64x1_t __s1 = __p1; \
  28920   __ret = (uint64x1_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \
  28921   __ret; \
  28922 })
  /* vsli_n_u16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint16x4_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 17, and yields the result
   * cast back to uint16x4_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 17 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28923 #ifdef __LITTLE_ENDIAN__
  28924 #define vsli_n_u16(__p0, __p1, __p2) __extension__ ({ \
  28925   uint16x4_t __ret; \
  28926   uint16x4_t __s0 = __p0; \
  28927   uint16x4_t __s1 = __p1; \
  28928   __ret = (uint16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \
  28929   __ret; \
  28930 })
  28931 #else
  28932 #define vsli_n_u16(__p0, __p1, __p2) __extension__ ({ \
  28933   uint16x4_t __ret; \
  28934   uint16x4_t __s0 = __p0; \
  28935   uint16x4_t __s1 = __p1; \
  28936   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  28937   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  28938   __ret = (uint16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \
  28939   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  28940   __ret; \
  28941 })
  28942 #endif
  28943 
  /* vsli_n_s8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int8x8_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 0, and yields the result
   * cast to int8x8_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 0 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28944 #ifdef __LITTLE_ENDIAN__
  28945 #define vsli_n_s8(__p0, __p1, __p2) __extension__ ({ \
  28946   int8x8_t __ret; \
  28947   int8x8_t __s0 = __p0; \
  28948   int8x8_t __s1 = __p1; \
  28949   __ret = (int8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \
  28950   __ret; \
  28951 })
  28952 #else
  28953 #define vsli_n_s8(__p0, __p1, __p2) __extension__ ({ \
  28954   int8x8_t __ret; \
  28955   int8x8_t __s0 = __p0; \
  28956   int8x8_t __s1 = __p1; \
  28957   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  28958   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  28959   __ret = (int8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \
  28960   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  28961   __ret; \
  28962 })
  28963 #endif
  28964 
  /* vsli_n_s32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int32x2_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 2, and yields the result
   * cast back to int32x2_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 2 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  28965 #ifdef __LITTLE_ENDIAN__
  28966 #define vsli_n_s32(__p0, __p1, __p2) __extension__ ({ \
  28967   int32x2_t __ret; \
  28968   int32x2_t __s0 = __p0; \
  28969   int32x2_t __s1 = __p1; \
  28970   __ret = (int32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  28971   __ret; \
  28972 })
  28973 #else
  28974 #define vsli_n_s32(__p0, __p1, __p2) __extension__ ({ \
  28975   int32x2_t __ret; \
  28976   int32x2_t __s0 = __p0; \
  28977   int32x2_t __s1 = __p1; \
  28978   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  28979   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  28980   __ret = (int32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  28981   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  28982   __ret; \
  28983 })
  28984 #endif
  28985 
  /* vsli_n_s64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int64x1_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 3, and yields the result
   * cast back to int64x1_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 3 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * This definition is not conditional on __LITTLE_ENDIAN__ and performs no
   * lane reversal. */
  28986 #define vsli_n_s64(__p0, __p1, __p2) __extension__ ({ \
  28987   int64x1_t __ret; \
  28988   int64x1_t __s0 = __p0; \
  28989   int64x1_t __s1 = __p1; \
  28990   __ret = (int64x1_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \
  28991   __ret; \
  28992 })
  /* vsli_n_s16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int16x4_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsli_n_v with trailing constant 1, and yields the result
   * cast back to int16x4_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 1 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  28993 #ifdef __LITTLE_ENDIAN__
  28994 #define vsli_n_s16(__p0, __p1, __p2) __extension__ ({ \
  28995   int16x4_t __ret; \
  28996   int16x4_t __s0 = __p0; \
  28997   int16x4_t __s1 = __p1; \
  28998   __ret = (int16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  28999   __ret; \
  29000 })
  29001 #else
  29002 #define vsli_n_s16(__p0, __p1, __p2) __extension__ ({ \
  29003   int16x4_t __ret; \
  29004   int16x4_t __s0 = __p0; \
  29005   int16x4_t __s1 = __p1; \
  29006   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29007   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29008   __ret = (int16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  29009   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29010   __ret; \
  29011 })
  29012 #endif
  29013 
  /* vsraq_n_u8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint8x16_t locals, passes them (cast to int8x16_t) plus __p2 to
   * __builtin_neon_vsraq_n_v with trailing constant 48, and yields the result
   * cast back to uint8x16_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 48 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 16 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29014 #ifdef __LITTLE_ENDIAN__
  29015 #define vsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29016   uint8x16_t __ret; \
  29017   uint8x16_t __s0 = __p0; \
  29018   uint8x16_t __s1 = __p1; \
  29019   __ret = (uint8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  29020   __ret; \
  29021 })
  29022 #else
  29023 #define vsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29024   uint8x16_t __ret; \
  29025   uint8x16_t __s0 = __p0; \
  29026   uint8x16_t __s1 = __p1; \
  29027   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29028   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29029   __ret = (uint8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  29030   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29031   __ret; \
  29032 })
  29033 #endif
  29034 
  /* vsraq_n_u32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint32x4_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 50, and yields the
   * result cast back to uint32x4_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 50 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29035 #ifdef __LITTLE_ENDIAN__
  29036 #define vsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29037   uint32x4_t __ret; \
  29038   uint32x4_t __s0 = __p0; \
  29039   uint32x4_t __s1 = __p1; \
  29040   __ret = (uint32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \
  29041   __ret; \
  29042 })
  29043 #else
  29044 #define vsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29045   uint32x4_t __ret; \
  29046   uint32x4_t __s0 = __p0; \
  29047   uint32x4_t __s1 = __p1; \
  29048   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29049   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29050   __ret = (uint32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \
  29051   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29052   __ret; \
  29053 })
  29054 #endif
  29055 
  /* vsraq_n_u64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint64x2_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 51, and yields the
   * result cast back to uint64x2_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 51 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  29056 #ifdef __LITTLE_ENDIAN__
  29057 #define vsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  29058   uint64x2_t __ret; \
  29059   uint64x2_t __s0 = __p0; \
  29060   uint64x2_t __s1 = __p1; \
  29061   __ret = (uint64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
  29062   __ret; \
  29063 })
  29064 #else
  29065 #define vsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  29066   uint64x2_t __ret; \
  29067   uint64x2_t __s0 = __p0; \
  29068   uint64x2_t __s1 = __p1; \
  29069   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  29070   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  29071   __ret = (uint64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
  29072   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  29073   __ret; \
  29074 })
  29075 #endif
  29076 
  /* vsraq_n_u16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint16x8_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 49, and yields the
   * result cast back to uint16x8_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 49 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29077 #ifdef __LITTLE_ENDIAN__
  29078 #define vsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  29079   uint16x8_t __ret; \
  29080   uint16x8_t __s0 = __p0; \
  29081   uint16x8_t __s1 = __p1; \
  29082   __ret = (uint16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \
  29083   __ret; \
  29084 })
  29085 #else
  29086 #define vsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \
  29087   uint16x8_t __ret; \
  29088   uint16x8_t __s0 = __p0; \
  29089   uint16x8_t __s1 = __p1; \
  29090   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29091   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29092   __ret = (uint16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
  29093   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29094   __ret; \
  29095 })
  29096 #endif
  29097 
  /* vsraq_n_s8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int8x16_t locals, passes them (cast to int8x16_t) plus __p2 to
   * __builtin_neon_vsraq_n_v with trailing constant 32, and yields the result
   * cast to int8x16_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 32 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 16 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29098 #ifdef __LITTLE_ENDIAN__
  29099 #define vsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  29100   int8x16_t __ret; \
  29101   int8x16_t __s0 = __p0; \
  29102   int8x16_t __s1 = __p1; \
  29103   __ret = (int8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  29104   __ret; \
  29105 })
  29106 #else
  29107 #define vsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \
  29108   int8x16_t __ret; \
  29109   int8x16_t __s0 = __p0; \
  29110   int8x16_t __s1 = __p1; \
  29111   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29112   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29113   __ret = (int8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  29114   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29115   __ret; \
  29116 })
  29117 #endif
  29118 
  /* vsraq_n_s32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int32x4_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 34, and yields the
   * result cast back to int32x4_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 34 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29119 #ifdef __LITTLE_ENDIAN__
  29120 #define vsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  29121   int32x4_t __ret; \
  29122   int32x4_t __s0 = __p0; \
  29123   int32x4_t __s1 = __p1; \
  29124   __ret = (int32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  29125   __ret; \
  29126 })
  29127 #else
  29128 #define vsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \
  29129   int32x4_t __ret; \
  29130   int32x4_t __s0 = __p0; \
  29131   int32x4_t __s1 = __p1; \
  29132   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29133   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29134   __ret = (int32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
  29135   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29136   __ret; \
  29137 })
  29138 #endif
  29139 
  /* vsraq_n_s64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int64x2_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 35, and yields the
   * result cast back to int64x2_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 35 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  29140 #ifdef __LITTLE_ENDIAN__
  29141 #define vsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  29142   int64x2_t __ret; \
  29143   int64x2_t __s0 = __p0; \
  29144   int64x2_t __s1 = __p1; \
  29145   __ret = (int64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \
  29146   __ret; \
  29147 })
  29148 #else
  29149 #define vsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \
  29150   int64x2_t __ret; \
  29151   int64x2_t __s0 = __p0; \
  29152   int64x2_t __s1 = __p1; \
  29153   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  29154   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  29155   __ret = (int64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \
  29156   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  29157   __ret; \
  29158 })
  29159 #endif
  29160 
  /* vsraq_n_s16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into int16x8_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsraq_n_v with trailing constant 33, and yields the
   * result cast back to int16x8_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 33 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29161 #ifdef __LITTLE_ENDIAN__
  29162 #define vsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  29163   int16x8_t __ret; \
  29164   int16x8_t __s0 = __p0; \
  29165   int16x8_t __s1 = __p1; \
  29166   __ret = (int16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  29167   __ret; \
  29168 })
  29169 #else
  29170 #define vsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \
  29171   int16x8_t __ret; \
  29172   int16x8_t __s0 = __p0; \
  29173   int16x8_t __s1 = __p1; \
  29174   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29175   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29176   __ret = (int16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  29177   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29178   __ret; \
  29179 })
  29180 #endif
  29181 
  /* vsra_n_u8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint8x8_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 16, and yields the result
   * cast back to uint8x8_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 16 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29182 #ifdef __LITTLE_ENDIAN__
  29183 #define vsra_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29184   uint8x8_t __ret; \
  29185   uint8x8_t __s0 = __p0; \
  29186   uint8x8_t __s1 = __p1; \
  29187   __ret = (uint8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \
  29188   __ret; \
  29189 })
  29190 #else
  29191 #define vsra_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29192   uint8x8_t __ret; \
  29193   uint8x8_t __s0 = __p0; \
  29194   uint8x8_t __s1 = __p1; \
  29195   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29196   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29197   __ret = (uint8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \
  29198   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29199   __ret; \
  29200 })
  29201 #endif
  29202 
  /* vsra_n_u32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint32x2_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 18, and yields the result
   * cast back to uint32x2_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 18 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  29203 #ifdef __LITTLE_ENDIAN__
  29204 #define vsra_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29205   uint32x2_t __ret; \
  29206   uint32x2_t __s0 = __p0; \
  29207   uint32x2_t __s1 = __p1; \
  29208   __ret = (uint32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \
  29209   __ret; \
  29210 })
  29211 #else
  29212 #define vsra_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29213   uint32x2_t __ret; \
  29214   uint32x2_t __s0 = __p0; \
  29215   uint32x2_t __s1 = __p1; \
  29216   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  29217   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  29218   __ret = (uint32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \
  29219   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  29220   __ret; \
  29221 })
  29222 #endif
  29223 
  /* vsra_n_u64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint64x1_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 19, and yields the result
   * cast back to uint64x1_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 19 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * This definition is not conditional on __LITTLE_ENDIAN__ and performs no
   * lane reversal. */
  29224 #define vsra_n_u64(__p0, __p1, __p2) __extension__ ({ \
  29225   uint64x1_t __ret; \
  29226   uint64x1_t __s0 = __p0; \
  29227   uint64x1_t __s1 = __p1; \
  29228   __ret = (uint64x1_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \
  29229   __ret; \
  29230 })
  /* vsra_n_u16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint16x4_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 17, and yields the result
   * cast back to uint16x4_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 17 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29231 #ifdef __LITTLE_ENDIAN__
  29232 #define vsra_n_u16(__p0, __p1, __p2) __extension__ ({ \
  29233   uint16x4_t __ret; \
  29234   uint16x4_t __s0 = __p0; \
  29235   uint16x4_t __s1 = __p1; \
  29236   __ret = (uint16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \
  29237   __ret; \
  29238 })
  29239 #else
  29240 #define vsra_n_u16(__p0, __p1, __p2) __extension__ ({ \
  29241   uint16x4_t __ret; \
  29242   uint16x4_t __s0 = __p0; \
  29243   uint16x4_t __s1 = __p1; \
  29244   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29245   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29246   __ret = (uint16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \
  29247   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29248   __ret; \
  29249 })
  29250 #endif
  29251 
  /* vsra_n_s8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int8x8_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 0, and yields the result
   * cast to int8x8_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 0 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29252 #ifdef __LITTLE_ENDIAN__
  29253 #define vsra_n_s8(__p0, __p1, __p2) __extension__ ({ \
  29254   int8x8_t __ret; \
  29255   int8x8_t __s0 = __p0; \
  29256   int8x8_t __s1 = __p1; \
  29257   __ret = (int8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \
  29258   __ret; \
  29259 })
  29260 #else
  29261 #define vsra_n_s8(__p0, __p1, __p2) __extension__ ({ \
  29262   int8x8_t __ret; \
  29263   int8x8_t __s0 = __p0; \
  29264   int8x8_t __s1 = __p1; \
  29265   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29266   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29267   __ret = (int8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \
  29268   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29269   __ret; \
  29270 })
  29271 #endif
  29272 
  /* vsra_n_s32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int32x2_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 2, and yields the result
   * cast back to int32x2_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 2 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  29273 #ifdef __LITTLE_ENDIAN__
  29274 #define vsra_n_s32(__p0, __p1, __p2) __extension__ ({ \
  29275   int32x2_t __ret; \
  29276   int32x2_t __s0 = __p0; \
  29277   int32x2_t __s1 = __p1; \
  29278   __ret = (int32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  29279   __ret; \
  29280 })
  29281 #else
  29282 #define vsra_n_s32(__p0, __p1, __p2) __extension__ ({ \
  29283   int32x2_t __ret; \
  29284   int32x2_t __s0 = __p0; \
  29285   int32x2_t __s1 = __p1; \
  29286   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  29287   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  29288   __ret = (int32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  29289   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  29290   __ret; \
  29291 })
  29292 #endif
  29293 
  /* vsra_n_s64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int64x1_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 3, and yields the result
   * cast back to int64x1_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 3 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * This definition is not conditional on __LITTLE_ENDIAN__ and performs no
   * lane reversal. */
  29294 #define vsra_n_s64(__p0, __p1, __p2) __extension__ ({ \
  29295   int64x1_t __ret; \
  29296   int64x1_t __s0 = __p0; \
  29297   int64x1_t __s1 = __p1; \
  29298   __ret = (int64x1_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \
  29299   __ret; \
  29300 })
  /* vsra_n_s16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into int16x4_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsra_n_v with trailing constant 1, and yields the result
   * cast back to int16x4_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 1 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29301 #ifdef __LITTLE_ENDIAN__
  29302 #define vsra_n_s16(__p0, __p1, __p2) __extension__ ({ \
  29303   int16x4_t __ret; \
  29304   int16x4_t __s0 = __p0; \
  29305   int16x4_t __s1 = __p1; \
  29306   __ret = (int16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  29307   __ret; \
  29308 })
  29309 #else
  29310 #define vsra_n_s16(__p0, __p1, __p2) __extension__ ({ \
  29311   int16x4_t __ret; \
  29312   int16x4_t __s0 = __p0; \
  29313   int16x4_t __s1 = __p1; \
  29314   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29315   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29316   __ret = (int16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  29317   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29318   __ret; \
  29319 })
  29320 #endif
  29321 
  /* vsri_n_p8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into poly8x8_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsri_n_v with trailing constant 4, and yields the result
   * cast back to poly8x8_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 4 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29322 #ifdef __LITTLE_ENDIAN__
  29323 #define vsri_n_p8(__p0, __p1, __p2) __extension__ ({ \
  29324   poly8x8_t __ret; \
  29325   poly8x8_t __s0 = __p0; \
  29326   poly8x8_t __s1 = __p1; \
  29327   __ret = (poly8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \
  29328   __ret; \
  29329 })
  29330 #else
  29331 #define vsri_n_p8(__p0, __p1, __p2) __extension__ ({ \
  29332   poly8x8_t __ret; \
  29333   poly8x8_t __s0 = __p0; \
  29334   poly8x8_t __s1 = __p1; \
  29335   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29336   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29337   __ret = (poly8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \
  29338   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29339   __ret; \
  29340 })
  29341 #endif
  29342 
  /* vsri_n_p16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into poly16x4_t locals, passes them (cast to int8x8_t) plus __p2 to
   * __builtin_neon_vsri_n_v with trailing constant 5, and yields the result
   * cast back to poly16x4_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 5 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29343 #ifdef __LITTLE_ENDIAN__
  29344 #define vsri_n_p16(__p0, __p1, __p2) __extension__ ({ \
  29345   poly16x4_t __ret; \
  29346   poly16x4_t __s0 = __p0; \
  29347   poly16x4_t __s1 = __p1; \
  29348   __ret = (poly16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \
  29349   __ret; \
  29350 })
  29351 #else
  29352 #define vsri_n_p16(__p0, __p1, __p2) __extension__ ({ \
  29353   poly16x4_t __ret; \
  29354   poly16x4_t __s0 = __p0; \
  29355   poly16x4_t __s1 = __p1; \
  29356   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29357   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29358   __ret = (poly16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 5); \
  29359   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29360   __ret; \
  29361 })
  29362 #endif
  29363 
  /* vsriq_n_p8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into poly8x16_t locals, passes them (cast to int8x16_t) plus __p2 to
   * __builtin_neon_vsriq_n_v with trailing constant 36, and yields the result
   * cast back to poly8x16_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 36 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 16 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29364 #ifdef __LITTLE_ENDIAN__
  29365 #define vsriq_n_p8(__p0, __p1, __p2) __extension__ ({ \
  29366   poly8x16_t __ret; \
  29367   poly8x16_t __s0 = __p0; \
  29368   poly8x16_t __s1 = __p1; \
  29369   __ret = (poly8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \
  29370   __ret; \
  29371 })
  29372 #else
  29373 #define vsriq_n_p8(__p0, __p1, __p2) __extension__ ({ \
  29374   poly8x16_t __ret; \
  29375   poly8x16_t __s0 = __p0; \
  29376   poly8x16_t __s1 = __p1; \
  29377   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29378   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29379   __ret = (poly8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
  29380   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29381   __ret; \
  29382 })
  29383 #endif
  29384 
  /* vsriq_n_p16(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into poly16x8_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsriq_n_v with trailing constant 37, and yields the
   * result cast back to poly16x8_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 37 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 8 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29385 #ifdef __LITTLE_ENDIAN__
  29386 #define vsriq_n_p16(__p0, __p1, __p2) __extension__ ({ \
  29387   poly16x8_t __ret; \
  29388   poly16x8_t __s0 = __p0; \
  29389   poly16x8_t __s1 = __p1; \
  29390   __ret = (poly16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \
  29391   __ret; \
  29392 })
  29393 #else
  29394 #define vsriq_n_p16(__p0, __p1, __p2) __extension__ ({ \
  29395   poly16x8_t __ret; \
  29396   poly16x8_t __s0 = __p0; \
  29397   poly16x8_t __s1 = __p1; \
  29398   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  29399   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  29400   __ret = (poly16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \
  29401   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  29402   __ret; \
  29403 })
  29404 #endif
  29405 
  /* vsriq_n_u8(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0 and
   * __p1 into uint8x16_t locals, passes them (cast to int8x16_t) plus __p2 to
   * __builtin_neon_vsriq_n_v with trailing constant 48, and yields the result
   * cast back to uint8x16_t. __p2 is forwarded as written, with no local copy.
   * NOTE(review): 48 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 16 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29406 #ifdef __LITTLE_ENDIAN__
  29407 #define vsriq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29408   uint8x16_t __ret; \
  29409   uint8x16_t __s0 = __p0; \
  29410   uint8x16_t __s1 = __p1; \
  29411   __ret = (uint8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  29412   __ret; \
  29413 })
  29414 #else
  29415 #define vsriq_n_u8(__p0, __p1, __p2) __extension__ ({ \
  29416   uint8x16_t __ret; \
  29417   uint8x16_t __s0 = __p0; \
  29418   uint8x16_t __s1 = __p1; \
  29419   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29420   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29421   __ret = (uint8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  29422   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  29423   __ret; \
  29424 })
  29425 #endif
  29426 
  /* vsriq_n_u32(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint32x4_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsriq_n_v with trailing constant 50, and yields the
   * result cast back to uint32x4_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 50 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 4 lanes of both inputs and of the result
   * are reversed via __builtin_shufflevector around the builtin call. */
  29427 #ifdef __LITTLE_ENDIAN__
  29428 #define vsriq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29429   uint32x4_t __ret; \
  29430   uint32x4_t __s0 = __p0; \
  29431   uint32x4_t __s1 = __p1; \
  29432   __ret = (uint32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \
  29433   __ret; \
  29434 })
  29435 #else
  29436 #define vsriq_n_u32(__p0, __p1, __p2) __extension__ ({ \
  29437   uint32x4_t __ret; \
  29438   uint32x4_t __s0 = __p0; \
  29439   uint32x4_t __s1 = __p1; \
  29440   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  29441   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  29442   __ret = (uint32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \
  29443   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  29444   __ret; \
  29445 })
  29446 #endif
  29447 
  /* vsriq_n_u64(__p0, __p1, __p2): GNU statement-expression macro. Copies __p0
   * and __p1 into uint64x2_t locals, passes them (cast to int8x16_t) plus __p2
   * to __builtin_neon_vsriq_n_v with trailing constant 51, and yields the
   * result cast back to uint64x2_t. __p2 is forwarded as written, no local copy.
   * NOTE(review): 51 presumably selects the element type and __p2 presumably
   * must be a constant shift amount -- confirm against Clang's NEON builtins.
   * Without __LITTLE_ENDIAN__, the 2 lanes of both inputs and of the result
   * are swapped via __builtin_shufflevector around the builtin call. */
  29448 #ifdef __LITTLE_ENDIAN__
  29449 #define vsriq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  29450   uint64x2_t __ret; \
  29451   uint64x2_t __s0 = __p0; \
  29452   uint64x2_t __s1 = __p1; \
  29453   __ret = (uint64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
  29454   __ret; \
  29455 })
  29456 #else
  29457 #define vsriq_n_u64(__p0, __p1, __p2) __extension__ ({ \
  29458   uint64x2_t __ret; \
  29459   uint64x2_t __s0 = __p0; \
  29460   uint64x2_t __s1 = __p1; \
  29461   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  29462   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  29463   __ret = (uint64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
  29464   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  29465   __ret; \
  29466 })
  29467 #endif
  29468 
  /* vsriq_n_u16(__p0, __p1, __p2): uint16x8_t front end for
   * __builtin_neon_vsriq_n_v, invoked with trailing argument 49. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsriq_n_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x8_t __src0 = __p0; \
    uint16x8_t __src1 = __p1; \
    uint16x8_t __res = (uint16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__src0, (int8x16_t)__src1, __p2, 49); \
    __res; \
  })
  #else
  #define vsriq_n_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x8_t __src0 = __p0; \
    uint16x8_t __src1 = __p1; \
    uint16x8_t __swp0 = __builtin_shufflevector(__src0, __src0, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint16x8_t __res = (uint16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__swp0, (int8x16_t)__swp1, __p2, 49); \
    __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29489 
  /* vsriq_n_s8(__p0, __p1, __p2): int8x16_t front end for
   * __builtin_neon_vsriq_n_v, invoked with trailing argument 32. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsriq_n_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16_t __src0 = __p0; \
    int8x16_t __src1 = __p1; \
    int8x16_t __res = (int8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__src0, (int8x16_t)__src1, __p2, 32); \
    __res; \
  })
  #else
  #define vsriq_n_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16_t __src0 = __p0; \
    int8x16_t __src1 = __p1; \
    int8x16_t __swp0 = __builtin_shufflevector(__src0, __src0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __res = (int8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__swp0, (int8x16_t)__swp1, __p2, 32); \
    __res = __builtin_shufflevector(__res, __res, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29510 
  /* vsriq_n_s32(__p0, __p1, __p2): int32x4_t front end for
   * __builtin_neon_vsriq_n_v, invoked with trailing argument 34. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsriq_n_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __src0 = __p0; \
    int32x4_t __src1 = __p1; \
    int32x4_t __res = (int32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__src0, (int8x16_t)__src1, __p2, 34); \
    __res; \
  })
  #else
  #define vsriq_n_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __src0 = __p0; \
    int32x4_t __src1 = __p1; \
    int32x4_t __swp0 = __builtin_shufflevector(__src0, __src0, 3, 2, 1, 0); \
    int32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    int32x4_t __res = (int32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__swp0, (int8x16_t)__swp1, __p2, 34); \
    __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29531 
  /* vsriq_n_s64(__p0, __p1, __p2): int64x2_t front end for
   * __builtin_neon_vsriq_n_v, invoked with trailing argument 35. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their two lanes swapped around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsriq_n_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2_t __src0 = __p0; \
    int64x2_t __src1 = __p1; \
    int64x2_t __res = (int64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__src0, (int8x16_t)__src1, __p2, 35); \
    __res; \
  })
  #else
  #define vsriq_n_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2_t __src0 = __p0; \
    int64x2_t __src1 = __p1; \
    int64x2_t __swp0 = __builtin_shufflevector(__src0, __src0, 1, 0); \
    int64x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    int64x2_t __res = (int64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__swp0, (int8x16_t)__swp1, __p2, 35); \
    __res = __builtin_shufflevector(__res, __res, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29552 
  /* vsriq_n_s16(__p0, __p1, __p2): int16x8_t front end for
   * __builtin_neon_vsriq_n_v, invoked with trailing argument 33. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsriq_n_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __src0 = __p0; \
    int16x8_t __src1 = __p1; \
    int16x8_t __res = (int16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__src0, (int8x16_t)__src1, __p2, 33); \
    __res; \
  })
  #else
  #define vsriq_n_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __src0 = __p0; \
    int16x8_t __src1 = __p1; \
    int16x8_t __swp0 = __builtin_shufflevector(__src0, __src0, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __res = (int16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__swp0, (int8x16_t)__swp1, __p2, 33); \
    __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29573 
  /* vsri_n_u8(__p0, __p1, __p2): uint8x8_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 16. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x8_t __src0 = __p0; \
    uint8x8_t __src1 = __p1; \
    uint8x8_t __res = (uint8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 16); \
    __res; \
  })
  #else
  #define vsri_n_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x8_t __src0 = __p0; \
    uint8x8_t __src1 = __p1; \
    uint8x8_t __swp0 = __builtin_shufflevector(__src0, __src0, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint8x8_t __res = (uint8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 16); \
    __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29594 
  /* vsri_n_u32(__p0, __p1, __p2): uint32x2_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 18. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their two lanes swapped around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x2_t __src0 = __p0; \
    uint32x2_t __src1 = __p1; \
    uint32x2_t __res = (uint32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 18); \
    __res; \
  })
  #else
  #define vsri_n_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x2_t __src0 = __p0; \
    uint32x2_t __src1 = __p1; \
    uint32x2_t __swp0 = __builtin_shufflevector(__src0, __src0, 1, 0); \
    uint32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    uint32x2_t __res = (uint32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 18); \
    __res = __builtin_shufflevector(__res, __res, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29615 
  /* vsri_n_u64(__p0, __p1, __p2): uint64x1_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 19. Defined once,
   * outside any __LITTLE_ENDIAN__ conditional; no lane shuffle is applied. */
  #define vsri_n_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x1_t __src0 = __p0; \
    uint64x1_t __src1 = __p1; \
    uint64x1_t __res = (uint64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 19); \
    __res; \
  })
  /* vsri_n_u16(__p0, __p1, __p2): uint16x4_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 17. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x4_t __src0 = __p0; \
    uint16x4_t __src1 = __p1; \
    uint16x4_t __res = (uint16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 17); \
    __res; \
  })
  #else
  #define vsri_n_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x4_t __src0 = __p0; \
    uint16x4_t __src1 = __p1; \
    uint16x4_t __swp0 = __builtin_shufflevector(__src0, __src0, 3, 2, 1, 0); \
    uint16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    uint16x4_t __res = (uint16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 17); \
    __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29643 
  /* vsri_n_s8(__p0, __p1, __p2): int8x8_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 0. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x8_t __src0 = __p0; \
    int8x8_t __src1 = __p1; \
    int8x8_t __res = (int8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 0); \
    __res; \
  })
  #else
  #define vsri_n_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x8_t __src0 = __p0; \
    int8x8_t __src1 = __p1; \
    int8x8_t __swp0 = __builtin_shufflevector(__src0, __src0, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x8_t __res = (int8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 0); \
    __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29664 
  /* vsri_n_s32(__p0, __p1, __p2): int32x2_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 2. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their two lanes swapped around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __src0 = __p0; \
    int32x2_t __src1 = __p1; \
    int32x2_t __res = (int32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 2); \
    __res; \
  })
  #else
  #define vsri_n_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __src0 = __p0; \
    int32x2_t __src1 = __p1; \
    int32x2_t __swp0 = __builtin_shufflevector(__src0, __src0, 1, 0); \
    int32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    int32x2_t __res = (int32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 2); \
    __res = __builtin_shufflevector(__res, __res, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29685 
  /* vsri_n_s64(__p0, __p1, __p2): int64x1_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 3. Defined once,
   * outside any __LITTLE_ENDIAN__ conditional; no lane shuffle is applied. */
  #define vsri_n_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x1_t __src0 = __p0; \
    int64x1_t __src1 = __p1; \
    int64x1_t __res = (int64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 3); \
    __res; \
  })
  /* vsri_n_s16(__p0, __p1, __p2): int16x4_t front end for
   * __builtin_neon_vsri_n_v, invoked with trailing argument 1. Every macro
   * argument is expanded once. When __LITTLE_ENDIAN__ is undefined, both inputs
   * and the result have their lanes reversed around the call. */
  #if defined(__LITTLE_ENDIAN__)
  #define vsri_n_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __src0 = __p0; \
    int16x4_t __src1 = __p1; \
    int16x4_t __res = (int16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__src0, (int8x8_t)__src1, __p2, 1); \
    __res; \
  })
  #else
  #define vsri_n_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __src0 = __p0; \
    int16x4_t __src1 = __p1; \
    int16x4_t __swp0 = __builtin_shufflevector(__src0, __src0, 3, 2, 1, 0); \
    int16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    int16x4_t __res = (int16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__swp0, (int8x8_t)__swp1, __p2, 1); \
    __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
    __res; \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29713 
  /* vst1_p8(__p0, __p1): hands __p0 and the poly8x8_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 4. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p8(__p0, __p1) __extension__ ({ \
    poly8x8_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 4); \
  })
  #else
  #define vst1_p8(__p0, __p1) __extension__ ({ \
    poly8x8_t __src1 = __p1; \
    poly8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 4); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29726 
  /* vst1_p16(__p0, __p1): hands __p0 and the poly16x4_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 5. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p16(__p0, __p1) __extension__ ({ \
    poly16x4_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 5); \
  })
  #else
  #define vst1_p16(__p0, __p1) __extension__ ({ \
    poly16x4_t __src1 = __p1; \
    poly16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 5); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29739 
  /* vst1q_p8(__p0, __p1): hands __p0 and the poly8x16_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 36. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p8(__p0, __p1) __extension__ ({ \
    poly8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 36); \
  })
  #else
  #define vst1q_p8(__p0, __p1) __extension__ ({ \
    poly8x16_t __src1 = __p1; \
    poly8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 36); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29752 
  /* vst1q_p16(__p0, __p1): hands __p0 and the poly16x8_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 37. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p16(__p0, __p1) __extension__ ({ \
    poly16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 37); \
  })
  #else
  #define vst1q_p16(__p0, __p1) __extension__ ({ \
    poly16x8_t __src1 = __p1; \
    poly16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 37); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29765 
  /* vst1q_u8(__p0, __p1): hands __p0 and the uint8x16_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 48. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u8(__p0, __p1) __extension__ ({ \
    uint8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 48); \
  })
  #else
  #define vst1q_u8(__p0, __p1) __extension__ ({ \
    uint8x16_t __src1 = __p1; \
    uint8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 48); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29778 
  /* vst1q_u32(__p0, __p1): hands __p0 and the uint32x4_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 50. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u32(__p0, __p1) __extension__ ({ \
    uint32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 50); \
  })
  #else
  #define vst1q_u32(__p0, __p1) __extension__ ({ \
    uint32x4_t __src1 = __p1; \
    uint32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 50); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29791 
  /* vst1q_u64(__p0, __p1): hands __p0 and the uint64x2_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 51. When __LITTLE_ENDIAN__
   * is undefined the two lanes of __p1 are swapped first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u64(__p0, __p1) __extension__ ({ \
    uint64x2_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 51); \
  })
  #else
  #define vst1q_u64(__p0, __p1) __extension__ ({ \
    uint64x2_t __src1 = __p1; \
    uint64x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 51); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29804 
  /* vst1q_u16(__p0, __p1): hands __p0 and the uint16x8_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 49. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u16(__p0, __p1) __extension__ ({ \
    uint16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 49); \
  })
  #else
  #define vst1q_u16(__p0, __p1) __extension__ ({ \
    uint16x8_t __src1 = __p1; \
    uint16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 49); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29817 
  /* vst1q_s8(__p0, __p1): hands __p0 and the int8x16_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 32. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s8(__p0, __p1) __extension__ ({ \
    int8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 32); \
  })
  #else
  #define vst1q_s8(__p0, __p1) __extension__ ({ \
    int8x16_t __src1 = __p1; \
    int8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 32); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29830 
  /* vst1q_f32(__p0, __p1): hands __p0 and the float32x4_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 41. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_f32(__p0, __p1) __extension__ ({ \
    float32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 41); \
  })
  #else
  #define vst1q_f32(__p0, __p1) __extension__ ({ \
    float32x4_t __src1 = __p1; \
    float32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 41); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29843 
  /* vst1q_s32(__p0, __p1): hands __p0 and the int32x4_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 34. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s32(__p0, __p1) __extension__ ({ \
    int32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 34); \
  })
  #else
  #define vst1q_s32(__p0, __p1) __extension__ ({ \
    int32x4_t __src1 = __p1; \
    int32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 34); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29856 
  /* vst1q_s64(__p0, __p1): hands __p0 and the int64x2_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 35. When __LITTLE_ENDIAN__
   * is undefined the two lanes of __p1 are swapped first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s64(__p0, __p1) __extension__ ({ \
    int64x2_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 35); \
  })
  #else
  #define vst1q_s64(__p0, __p1) __extension__ ({ \
    int64x2_t __src1 = __p1; \
    int64x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 35); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29869 
  /* vst1q_s16(__p0, __p1): hands __p0 and the int16x8_t value __p1 to
   * __builtin_neon_vst1q_v with trailing argument 33. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s16(__p0, __p1) __extension__ ({ \
    int16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__src1, 33); \
  })
  #else
  #define vst1q_s16(__p0, __p1) __extension__ ({ \
    int16x8_t __src1 = __p1; \
    int16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_v(__p0, (int8x16_t)__swp1, 33); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29882 
  /* vst1_u8(__p0, __p1): hands __p0 and the uint8x8_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 16. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u8(__p0, __p1) __extension__ ({ \
    uint8x8_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 16); \
  })
  #else
  #define vst1_u8(__p0, __p1) __extension__ ({ \
    uint8x8_t __src1 = __p1; \
    uint8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 16); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29895 
  /* vst1_u32(__p0, __p1): hands __p0 and the uint32x2_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 18. When __LITTLE_ENDIAN__
   * is undefined the two lanes of __p1 are swapped first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u32(__p0, __p1) __extension__ ({ \
    uint32x2_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 18); \
  })
  #else
  #define vst1_u32(__p0, __p1) __extension__ ({ \
    uint32x2_t __src1 = __p1; \
    uint32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 18); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29908 
  /* vst1_u64(__p0, __p1): hands __p0 and the uint64x1_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 19. Defined once, outside
   * any __LITTLE_ENDIAN__ conditional; no lane shuffle is applied. */
  #define vst1_u64(__p0, __p1) __extension__ ({ \
    uint64x1_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 19); \
  })
  /* vst1_u16(__p0, __p1): hands __p0 and the uint16x4_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 17. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u16(__p0, __p1) __extension__ ({ \
    uint16x4_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 17); \
  })
  #else
  #define vst1_u16(__p0, __p1) __extension__ ({ \
    uint16x4_t __src1 = __p1; \
    uint16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 17); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29925 
  /* vst1_s8(__p0, __p1): hands __p0 and the int8x8_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 0. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s8(__p0, __p1) __extension__ ({ \
    int8x8_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 0); \
  })
  #else
  #define vst1_s8(__p0, __p1) __extension__ ({ \
    int8x8_t __src1 = __p1; \
    int8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 0); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29938 
  /* vst1_f32(__p0, __p1): hands __p0 and the float32x2_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 9. When __LITTLE_ENDIAN__
   * is undefined the two lanes of __p1 are swapped first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_f32(__p0, __p1) __extension__ ({ \
    float32x2_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 9); \
  })
  #else
  #define vst1_f32(__p0, __p1) __extension__ ({ \
    float32x2_t __src1 = __p1; \
    float32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 9); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29951 
  /* vst1_s32(__p0, __p1): hands __p0 and the int32x2_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 2. When __LITTLE_ENDIAN__
   * is undefined the two lanes of __p1 are swapped first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s32(__p0, __p1) __extension__ ({ \
    int32x2_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 2); \
  })
  #else
  #define vst1_s32(__p0, __p1) __extension__ ({ \
    int32x2_t __src1 = __p1; \
    int32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 2); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29964 
  /* vst1_s64(__p0, __p1): hands __p0 and the int64x1_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 3. Defined once, outside
   * any __LITTLE_ENDIAN__ conditional; no lane shuffle is applied. */
  #define vst1_s64(__p0, __p1) __extension__ ({ \
    int64x1_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 3); \
  })
  /* vst1_s16(__p0, __p1): hands __p0 and the int16x4_t value __p1 to
   * __builtin_neon_vst1_v with trailing argument 1. When __LITTLE_ENDIAN__
   * is undefined the lanes of __p1 are reversed first. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s16(__p0, __p1) __extension__ ({ \
    int16x4_t __src1 = __p1; \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__src1, 1); \
  })
  #else
  #define vst1_s16(__p0, __p1) __extension__ ({ \
    int16x4_t __src1 = __p1; \
    int16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1_v(__p0, (int8x8_t)__swp1, 1); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29981 
  /* vst1_lane_p8(__p0, __p1, __p2): hands __p0, the poly8x8_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 4. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x8_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 4); \
  })
  #else
  #define vst1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x8_t __src1 = __p1; \
    poly8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 4); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  29994 
  /* vst1_lane_p16(__p0, __p1, __p2): hands __p0, the poly16x4_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 5. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
    poly16x4_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 5); \
  })
  #else
  #define vst1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
    poly16x4_t __src1 = __p1; \
    poly16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 5); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30007 
  /* vst1q_lane_p8(__p0, __p1, __p2): hands __p0, the poly8x16_t value __p1 and
   * __p2 to __builtin_neon_vst1q_lane_v with trailing argument 36. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 36); \
  })
  #else
  #define vst1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16_t __src1 = __p1; \
    poly8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 36); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30020 
  /* vst1q_lane_p16(__p0, __p1, __p2): hands __p0, the poly16x8_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 37. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
    poly16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 37); \
  })
  #else
  #define vst1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
    poly16x8_t __src1 = __p1; \
    poly16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 37); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30033 
  /* vst1q_lane_u8(__p0, __p1, __p2): hands __p0, the uint8x16_t value __p1 and
   * __p2 to __builtin_neon_vst1q_lane_v with trailing argument 48. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 48); \
  })
  #else
  #define vst1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16_t __src1 = __p1; \
    uint8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 48); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30046 
  /* vst1q_lane_u32(__p0, __p1, __p2): hands __p0, the uint32x4_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 50. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 50); \
  })
  #else
  #define vst1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x4_t __src1 = __p1; \
    uint32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 50); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30059 
  /* vst1q_lane_u64(__p0, __p1, __p2): hands __p0, the uint64x2_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 51. When
   * __LITTLE_ENDIAN__ is undefined the two lanes of __p1 are swapped first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 51); \
  })
  #else
  #define vst1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2_t __src1 = __p1; \
    uint64x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 51); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30072 
  /* vst1q_lane_u16(__p0, __p1, __p2): hands __p0, the uint16x8_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 49. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 49); \
  })
  #else
  #define vst1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x8_t __src1 = __p1; \
    uint16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 49); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30085 
  /* vst1q_lane_s8(__p0, __p1, __p2): hands __p0, the int8x16_t value __p1 and
   * __p2 to __builtin_neon_vst1q_lane_v with trailing argument 32. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 32); \
  })
  #else
  #define vst1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16_t __src1 = __p1; \
    int8x16_t __swp1 = __builtin_shufflevector(__src1, __src1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 32); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30098 
  /* vst1q_lane_f32(__p0, __p1, __p2): hands __p0, the float32x4_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 41. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
    float32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 41); \
  })
  #else
  #define vst1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
    float32x4_t __src1 = __p1; \
    float32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 41); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30111 
  /* vst1q_lane_s32(__p0, __p1, __p2): hands __p0, the int32x4_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 34. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 34); \
  })
  #else
  #define vst1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __src1 = __p1; \
    int32x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 34); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30124 
  /* vst1q_lane_s64(__p0, __p1, __p2): hands __p0, the int64x2_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 35. When
   * __LITTLE_ENDIAN__ is undefined the two lanes of __p1 are swapped first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 35); \
  })
  #else
  #define vst1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2_t __src1 = __p1; \
    int64x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 35); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30137 
  /* vst1q_lane_s16(__p0, __p1, __p2): hands __p0, the int16x8_t value __p1
   * and __p2 to __builtin_neon_vst1q_lane_v with trailing argument 33. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __src1 = __p1; \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__src1, __p2, 33); \
  })
  #else
  #define vst1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __src1 = __p1; \
    int16x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__swp1, __p2, 33); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30150 
  /* vst1_lane_u8(__p0, __p1, __p2): hands __p0, the uint8x8_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 16. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x8_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 16); \
  })
  #else
  #define vst1_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x8_t __src1 = __p1; \
    uint8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 16); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30163 
  /* vst1_lane_u32(__p0, __p1, __p2): hands __p0, the uint32x2_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 18. When
   * __LITTLE_ENDIAN__ is undefined the two lanes of __p1 are swapped first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x2_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 18); \
  })
  #else
  #define vst1_lane_u32(__p0, __p1, __p2) __extension__ ({ \
    uint32x2_t __src1 = __p1; \
    uint32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 18); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30176 
  /* vst1_lane_u64(__p0, __p1, __p2): hands __p0, the uint64x1_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 19. Defined once,
   * outside any __LITTLE_ENDIAN__ conditional; no lane shuffle is applied. */
  #define vst1_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x1_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 19); \
  })
  /* vst1_lane_u16(__p0, __p1, __p2): hands __p0, the uint16x4_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 17. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x4_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 17); \
  })
  #else
  #define vst1_lane_u16(__p0, __p1, __p2) __extension__ ({ \
    uint16x4_t __src1 = __p1; \
    uint16x4_t __swp1 = __builtin_shufflevector(__src1, __src1, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 17); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30193 
  /* vst1_lane_s8(__p0, __p1, __p2): hands __p0, the int8x8_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 0. When
   * __LITTLE_ENDIAN__ is undefined the lanes of __p1 are reversed first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x8_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 0); \
  })
  #else
  #define vst1_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x8_t __src1 = __p1; \
    int8x8_t __swp1 = __builtin_shufflevector(__src1, __src1, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 0); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30206 
  /* vst1_lane_f32(__p0, __p1, __p2): hands __p0, the float32x2_t value __p1
   * and __p2 to __builtin_neon_vst1_lane_v with trailing argument 9. When
   * __LITTLE_ENDIAN__ is undefined the two lanes of __p1 are swapped first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_f32(__p0, __p1, __p2) __extension__ ({ \
    float32x2_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 9); \
  })
  #else
  #define vst1_lane_f32(__p0, __p1, __p2) __extension__ ({ \
    float32x2_t __src1 = __p1; \
    float32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 9); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30219 
  /* vst1_lane_s32(__p0, __p1, __p2): hands __p0, the int32x2_t value __p1 and
   * __p2 to __builtin_neon_vst1_lane_v with trailing argument 2. When
   * __LITTLE_ENDIAN__ is undefined the two lanes of __p1 are swapped first;
   * __p2 is forwarded unchanged in both variants. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __src1 = __p1; \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__src1, __p2, 2); \
  })
  #else
  #define vst1_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __src1 = __p1; \
    int32x2_t __swp1 = __builtin_shufflevector(__src1, __src1, 1, 0); \
    __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__swp1, __p2, 2); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30232 
  /* vst1_lane_s64(__p0, __p1, __p2): copy __p1 into a local int64x1_t and
   * pass it (cast to int8x8_t), together with __p0 and __p2, to
   * __builtin_neon_vst1_lane_v. Defined once, with no __LITTLE_ENDIAN__
   * split and no element reversal.
   * NOTE(review): the trailing 3 is presumably the builtin's type code. */
  #define vst1_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x1_t __s1 = __p1; \
    __builtin_neon_vst1_lane_v( \
        __p0, (int8x8_t)__s1, __p2, 3); \
  })
  /* vst1_lane_s16(__p0, __p1, __p2): copy __p1 into a local int16x4_t and
   * pass it (cast to int8x8_t), together with __p0 and __p2, to
   * __builtin_neon_vst1_lane_v. Builds without __LITTLE_ENDIAN__ reverse the
   * 4 elements before the call.
   * NOTE(review): the trailing 1 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s1 = __p1; \
    __builtin_neon_vst1_lane_v( \
        __p0, (int8x8_t)__s1, __p2, 1); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s1 = __p1; \
    int16x4_t __rev1 = \
        __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    __builtin_neon_vst1_lane_v( \
        __p0, (int8x8_t)__rev1, __p2, 1); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30249 
  /* vst1_p8_x2(__p0, __p1): copy the poly8x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 4 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p8_x2(__p0, __p1) __extension__ ({ \
    poly8x8x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        4); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_p8_x2(__p0, __p1) __extension__ ({ \
    poly8x8x2_t __s1 = __p1; \
    poly8x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        4); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30264 
  /* vst1_p16_x2(__p0, __p1): copy the poly16x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 5 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p16_x2(__p0, __p1) __extension__ ({ \
    poly16x4x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        5); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_p16_x2(__p0, __p1) __extension__ ({ \
    poly16x4x2_t __s1 = __p1; \
    poly16x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        5); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30279 
  /* vst1q_p8_x2(__p0, __p1): copy the poly8x16x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 16 elements of each vector
   * first.
   * NOTE(review): the trailing 36 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p8_x2(__p0, __p1) __extension__ ({ \
    poly8x16x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        36); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_p8_x2(__p0, __p1) __extension__ ({ \
    poly8x16x2_t __s1 = __p1; \
    poly8x16x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        36); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30294 
  /* vst1q_p16_x2(__p0, __p1): copy the poly16x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 8 elements of each vector
   * first.
   * NOTE(review): the trailing 37 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p16_x2(__p0, __p1) __extension__ ({ \
    poly16x8x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        37); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_p16_x2(__p0, __p1) __extension__ ({ \
    poly16x8x2_t __s1 = __p1; \
    poly16x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        37); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30309 
  /* vst1q_u8_x2(__p0, __p1): copy the uint8x16x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 16 elements of each vector
   * first.
   * NOTE(review): the trailing 48 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u8_x2(__p0, __p1) __extension__ ({ \
    uint8x16x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        48); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u8_x2(__p0, __p1) __extension__ ({ \
    uint8x16x2_t __s1 = __p1; \
    uint8x16x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        48); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30324 
  /* vst1q_u32_x2(__p0, __p1): copy the uint32x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 4 elements of each vector
   * first.
   * NOTE(review): the trailing 50 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u32_x2(__p0, __p1) __extension__ ({ \
    uint32x4x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        50); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u32_x2(__p0, __p1) __extension__ ({ \
    uint32x4x2_t __s1 = __p1; \
    uint32x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        50); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30339 
  /* vst1q_u64_x2(__p0, __p1): copy the uint64x2x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ swap the 2 elements of each vector
   * first.
   * NOTE(review): the trailing 51 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u64_x2(__p0, __p1) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        51); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u64_x2(__p0, __p1) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    uint64x2x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        51); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30354 
  /* vst1q_u16_x2(__p0, __p1): copy the uint16x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 8 elements of each vector
   * first.
   * NOTE(review): the trailing 49 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u16_x2(__p0, __p1) __extension__ ({ \
    uint16x8x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        49); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u16_x2(__p0, __p1) __extension__ ({ \
    uint16x8x2_t __s1 = __p1; \
    uint16x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        49); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30369 
  /* vst1q_s8_x2(__p0, __p1): copy the int8x16x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 16 elements of each vector
   * first.
   * NOTE(review): the trailing 32 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s8_x2(__p0, __p1) __extension__ ({ \
    int8x16x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        32); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s8_x2(__p0, __p1) __extension__ ({ \
    int8x16x2_t __s1 = __p1; \
    int8x16x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        32); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30384 
  /* vst1q_f32_x2(__p0, __p1): copy the float32x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 4 elements of each vector
   * first.
   * NOTE(review): the trailing 41 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_f32_x2(__p0, __p1) __extension__ ({ \
    float32x4x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        41); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_f32_x2(__p0, __p1) __extension__ ({ \
    float32x4x2_t __s1 = __p1; \
    float32x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        41); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30399 
  /* vst1q_s32_x2(__p0, __p1): copy the int32x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 4 elements of each vector
   * first.
   * NOTE(review): the trailing 34 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s32_x2(__p0, __p1) __extension__ ({ \
    int32x4x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        34); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s32_x2(__p0, __p1) __extension__ ({ \
    int32x4x2_t __s1 = __p1; \
    int32x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        34); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30414 
  /* vst1q_s64_x2(__p0, __p1): copy the int64x2x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ swap the 2 elements of each vector
   * first.
   * NOTE(review): the trailing 35 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s64_x2(__p0, __p1) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        35); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s64_x2(__p0, __p1) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    int64x2x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        35); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30429 
  /* vst1q_s16_x2(__p0, __p1): copy the int16x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x16_t) to __builtin_neon_vst1q_x2_v.
   * Builds without __LITTLE_ENDIAN__ reverse the 8 elements of each vector
   * first.
   * NOTE(review): the trailing 33 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s16_x2(__p0, __p1) __extension__ ({ \
    int16x8x2_t __s1 = __p1; \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        33); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s16_x2(__p0, __p1) __extension__ ({ \
    int16x8x2_t __s1 = __p1; \
    int16x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x2_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        33); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30444 
  /* vst1_u8_x2(__p0, __p1): copy the uint8x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 16 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u8_x2(__p0, __p1) __extension__ ({ \
    uint8x8x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        16); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u8_x2(__p0, __p1) __extension__ ({ \
    uint8x8x2_t __s1 = __p1; \
    uint8x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        16); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30459 
  /* vst1_u32_x2(__p0, __p1): copy the uint32x2x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 18 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u32_x2(__p0, __p1) __extension__ ({ \
    uint32x2x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        18); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u32_x2(__p0, __p1) __extension__ ({ \
    uint32x2x2_t __s1 = __p1; \
    uint32x2x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        18); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30474 
  /* vst1_u64_x2(__p0, __p1): copy the uint64x1x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v.
   * Defined once, with no __LITTLE_ENDIAN__ split and no element reversal.
   * NOTE(review): the trailing 19 is presumably the builtin's type code. */
  #define vst1_u64_x2(__p0, __p1) __extension__ ({ \
    uint64x1x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        19); \
  })
  /* vst1_u16_x2(__p0, __p1): copy the uint16x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 17 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u16_x2(__p0, __p1) __extension__ ({ \
    uint16x4x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        17); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u16_x2(__p0, __p1) __extension__ ({ \
    uint16x4x2_t __s1 = __p1; \
    uint16x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        17); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30493 
  /* vst1_s8_x2(__p0, __p1): copy the int8x8x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 0 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s8_x2(__p0, __p1) __extension__ ({ \
    int8x8x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        0); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_s8_x2(__p0, __p1) __extension__ ({ \
    int8x8x2_t __s1 = __p1; \
    int8x8x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        0); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30508 
  /* vst1_f32_x2(__p0, __p1): copy the float32x2x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 9 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_f32_x2(__p0, __p1) __extension__ ({ \
    float32x2x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        9); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_f32_x2(__p0, __p1) __extension__ ({ \
    float32x2x2_t __s1 = __p1; \
    float32x2x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        9); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30523 
  /* vst1_s32_x2(__p0, __p1): copy the int32x2x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 2 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s32_x2(__p0, __p1) __extension__ ({ \
    int32x2x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        2); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_s32_x2(__p0, __p1) __extension__ ({ \
    int32x2x2_t __s1 = __p1; \
    int32x2x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        2); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30538 
  /* vst1_s64_x2(__p0, __p1): copy the int64x1x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v.
   * Defined once, with no __LITTLE_ENDIAN__ split and no element reversal.
   * NOTE(review): the trailing 3 is presumably the builtin's type code. */
  #define vst1_s64_x2(__p0, __p1) __extension__ ({ \
    int64x1x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        3); \
  })
  /* vst1_s16_x2(__p0, __p1): copy the int16x4x2_t __p1 and pass __p0 plus
   * val[0] and val[1] (cast to int8x8_t) to __builtin_neon_vst1_x2_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 1 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s16_x2(__p0, __p1) __extension__ ({ \
    int16x4x2_t __s1 = __p1; \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        1); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_s16_x2(__p0, __p1) __extension__ ({ \
    int16x4x2_t __s1 = __p1; \
    int16x4x2_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __builtin_neon_vst1_x2_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        1); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30557 
  /* vst1_p8_x3(__p0, __p1): copy the poly8x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 4 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p8_x3(__p0, __p1) __extension__ ({ \
    poly8x8x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        4); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_p8_x3(__p0, __p1) __extension__ ({ \
    poly8x8x3_t __s1 = __p1; \
    poly8x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        4); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30573 
  /* vst1_p16_x3(__p0, __p1): copy the poly16x4x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 5 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_p16_x3(__p0, __p1) __extension__ ({ \
    poly16x4x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        5); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_p16_x3(__p0, __p1) __extension__ ({ \
    poly16x4x3_t __s1 = __p1; \
    poly16x4x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        5); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30589 
  /* vst1q_p8_x3(__p0, __p1): copy the poly8x16x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 16 elements of each vector first.
   * NOTE(review): the trailing 36 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p8_x3(__p0, __p1) __extension__ ({ \
    poly8x16x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        36); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_p8_x3(__p0, __p1) __extension__ ({ \
    poly8x16x3_t __s1 = __p1; \
    poly8x16x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        36); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30605 
  /* vst1q_p16_x3(__p0, __p1): copy the poly16x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 37 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_p16_x3(__p0, __p1) __extension__ ({ \
    poly16x8x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        37); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_p16_x3(__p0, __p1) __extension__ ({ \
    poly16x8x3_t __s1 = __p1; \
    poly16x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        37); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30621 
  /* vst1q_u8_x3(__p0, __p1): copy the uint8x16x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 16 elements of each vector first.
   * NOTE(review): the trailing 48 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u8_x3(__p0, __p1) __extension__ ({ \
    uint8x16x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        48); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u8_x3(__p0, __p1) __extension__ ({ \
    uint8x16x3_t __s1 = __p1; \
    uint8x16x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        48); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30637 
  /* vst1q_u32_x3(__p0, __p1): copy the uint32x4x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 50 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u32_x3(__p0, __p1) __extension__ ({ \
    uint32x4x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        50); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u32_x3(__p0, __p1) __extension__ ({ \
    uint32x4x3_t __s1 = __p1; \
    uint32x4x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        50); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30653 
  /* vst1q_u64_x3(__p0, __p1): copy the uint64x2x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 51 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u64_x3(__p0, __p1) __extension__ ({ \
    uint64x2x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        51); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u64_x3(__p0, __p1) __extension__ ({ \
    uint64x2x3_t __s1 = __p1; \
    uint64x2x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        51); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30669 
  /* vst1q_u16_x3(__p0, __p1): copy the uint16x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 49 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_u16_x3(__p0, __p1) __extension__ ({ \
    uint16x8x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        49); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_u16_x3(__p0, __p1) __extension__ ({ \
    uint16x8x3_t __s1 = __p1; \
    uint16x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        49); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30685 
  /* vst1q_s8_x3(__p0, __p1): copy the int8x16x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 16 elements of each vector first.
   * NOTE(review): the trailing 32 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s8_x3(__p0, __p1) __extension__ ({ \
    int8x16x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        32); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s8_x3(__p0, __p1) __extension__ ({ \
    int8x16x3_t __s1 = __p1; \
    int8x16x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], \
        15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        32); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30701 
  /* vst1q_f32_x3(__p0, __p1): copy the float32x4x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 41 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_f32_x3(__p0, __p1) __extension__ ({ \
    float32x4x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        41); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_f32_x3(__p0, __p1) __extension__ ({ \
    float32x4x3_t __s1 = __p1; \
    float32x4x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        41); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30717 
  /* vst1q_s32_x3(__p0, __p1): copy the int32x4x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 34 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s32_x3(__p0, __p1) __extension__ ({ \
    int32x4x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        34); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s32_x3(__p0, __p1) __extension__ ({ \
    int32x4x3_t __s1 = __p1; \
    int32x4x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        34); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30733 
  /* vst1q_s64_x3(__p0, __p1): copy the int64x2x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 35 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s64_x3(__p0, __p1) __extension__ ({ \
    int64x2x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        35); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s64_x3(__p0, __p1) __extension__ ({ \
    int64x2x3_t __s1 = __p1; \
    int64x2x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        35); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30749 
  /* vst1q_s16_x3(__p0, __p1): copy the int16x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x16_t) to __builtin_neon_vst1q_x3_v. Builds
   * without __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 33 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1q_s16_x3(__p0, __p1) __extension__ ({ \
    int16x8x3_t __s1 = __p1; \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__s1.val[0], \
        (int8x16_t)__s1.val[1], \
        (int8x16_t)__s1.val[2], \
        33); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1q_s16_x3(__p0, __p1) __extension__ ({ \
    int16x8x3_t __s1 = __p1; \
    int16x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1q_x3_v( \
        __p0, \
        (int8x16_t)__rev1.val[0], \
        (int8x16_t)__rev1.val[1], \
        (int8x16_t)__rev1.val[2], \
        33); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30765 
  /* vst1_u8_x3(__p0, __p1): copy the uint8x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 16 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u8_x3(__p0, __p1) __extension__ ({ \
    uint8x8x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        16); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u8_x3(__p0, __p1) __extension__ ({ \
    uint8x8x3_t __s1 = __p1; \
    uint8x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        16); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30781 
  /* vst1_u32_x3(__p0, __p1): copy the uint32x2x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 18 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u32_x3(__p0, __p1) __extension__ ({ \
    uint32x2x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        18); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u32_x3(__p0, __p1) __extension__ ({ \
    uint32x2x3_t __s1 = __p1; \
    uint32x2x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        18); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30797 
  /* vst1_u64_x3(__p0, __p1): copy the uint64x1x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Defined once,
   * with no __LITTLE_ENDIAN__ split and no element reversal.
   * NOTE(review): the trailing 19 is presumably the builtin's type code. */
  #define vst1_u64_x3(__p0, __p1) __extension__ ({ \
    uint64x1x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        19); \
  })
  /* vst1_u16_x3(__p0, __p1): copy the uint16x4x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ reverse the 4 elements of each vector first.
   * NOTE(review): the trailing 17 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_u16_x3(__p0, __p1) __extension__ ({ \
    uint16x4x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        17); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_u16_x3(__p0, __p1) __extension__ ({ \
    uint16x4x3_t __s1 = __p1; \
    uint16x4x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 3, 2, 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        17); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30817 
  /* vst1_s8_x3(__p0, __p1): copy the int8x8x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ reverse the 8 elements of each vector first.
   * NOTE(review): the trailing 0 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s8_x3(__p0, __p1) __extension__ ({ \
    int8x8x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        0); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_s8_x3(__p0, __p1) __extension__ ({ \
    int8x8x3_t __s1 = __p1; \
    int8x8x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        0); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30833 
  /* vst1_f32_x3(__p0, __p1): copy the float32x2x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 9 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_f32_x3(__p0, __p1) __extension__ ({ \
    float32x2x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        9); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_f32_x3(__p0, __p1) __extension__ ({ \
    float32x2x3_t __s1 = __p1; \
    float32x2x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        9); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30849 
  /* vst1_s32_x3(__p0, __p1): copy the int32x2x3_t __p1 and pass __p0 plus
   * val[0..2] (cast to int8x8_t) to __builtin_neon_vst1_x3_v. Builds without
   * __LITTLE_ENDIAN__ swap the 2 elements of each vector first.
   * NOTE(review): the trailing 2 is presumably the builtin's type code. */
  #if defined(__LITTLE_ENDIAN__)
  #define vst1_s32_x3(__p0, __p1) __extension__ ({ \
    int32x2x3_t __s1 = __p1; \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__s1.val[0], \
        (int8x8_t)__s1.val[1], \
        (int8x8_t)__s1.val[2], \
        2); \
  })
  #else /* !__LITTLE_ENDIAN__ */
  #define vst1_s32_x3(__p0, __p1) __extension__ ({ \
    int32x2x3_t __s1 = __p1; \
    int32x2x3_t __rev1; \
    __rev1.val[0] = __builtin_shufflevector( \
        __s1.val[0], __s1.val[0], 1, 0); \
    __rev1.val[1] = __builtin_shufflevector( \
        __s1.val[1], __s1.val[1], 1, 0); \
    __rev1.val[2] = __builtin_shufflevector( \
        __s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1_x3_v( \
        __p0, \
        (int8x8_t)__rev1.val[0], \
        (int8x8_t)__rev1.val[1], \
        (int8x8_t)__rev1.val[2], \
        2); \
  })
  #endif /* __LITTLE_ENDIAN__ */
  30865 
  /* vst1_s64_x3: binds __p1 to an int64x1x3_t temporary, then passes __p0 and
   * its three val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x3_v
   * with trailing constant 3. Defined once, with no __LITTLE_ENDIAN__ split and
   * no lane reversal (presumably because each vector has one lane -- TODO confirm).
   * NOTE(review): builtin behavior and the constant's meaning are not shown here. */
  30866 #define vst1_s64_x3(__p0, __p1) __extension__ ({ \
  30867   int64x1x3_t __s1 = __p1; \
  30868   __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 3); \
  30869 })
  30870 #ifdef __LITTLE_ENDIAN__
        /* vst1_s16_x3: binds __p1 to an int16x4x3_t temporary, then passes __p0 and
         * its three val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x3_v
         * with trailing constant 1.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30871 #define vst1_s16_x3(__p0, __p1) __extension__ ({ \
  30872   int16x4x3_t __s1 = __p1; \
  30873   __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 1); \
  30874 })
  30875 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  30876 #define vst1_s16_x3(__p0, __p1) __extension__ ({ \
  30877   int16x4x3_t __s1 = __p1; \
  30878   int16x4x3_t __rev1; \
  30879   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  30880   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  30881   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  30882   __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 1); \
  30883 })
  30884 #endif
  30885 
  30886 #ifdef __LITTLE_ENDIAN__
        /* vst1_p8_x4: binds __p1 to a poly8x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 4.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30887 #define vst1_p8_x4(__p0, __p1) __extension__ ({ \
  30888   poly8x8x4_t __s1 = __p1; \
  30889   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 4); \
  30890 })
  30891 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  30892 #define vst1_p8_x4(__p0, __p1) __extension__ ({ \
  30893   poly8x8x4_t __s1 = __p1; \
  30894   poly8x8x4_t __rev1; \
  30895   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  30896   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  30897   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  30898   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  30899   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 4); \
  30900 })
  30901 #endif
  30902 
  30903 #ifdef __LITTLE_ENDIAN__
        /* vst1_p16_x4: binds __p1 to a poly16x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 5.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30904 #define vst1_p16_x4(__p0, __p1) __extension__ ({ \
  30905   poly16x4x4_t __s1 = __p1; \
  30906   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 5); \
  30907 })
  30908 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  30909 #define vst1_p16_x4(__p0, __p1) __extension__ ({ \
  30910   poly16x4x4_t __s1 = __p1; \
  30911   poly16x4x4_t __rev1; \
  30912   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  30913   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  30914   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  30915   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  30916   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 5); \
  30917 })
  30918 #endif
  30919 
  30920 #ifdef __LITTLE_ENDIAN__
        /* vst1q_p8_x4: binds __p1 to a poly8x16x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 36.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30921 #define vst1q_p8_x4(__p0, __p1) __extension__ ({ \
  30922   poly8x16x4_t __s1 = __p1; \
  30923   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 36); \
  30924 })
  30925 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  30926 #define vst1q_p8_x4(__p0, __p1) __extension__ ({ \
  30927   poly8x16x4_t __s1 = __p1; \
  30928   poly8x16x4_t __rev1; \
  30929   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30930   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30931   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30932   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30933   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 36); \
  30934 })
  30935 #endif
  30936 
  30937 #ifdef __LITTLE_ENDIAN__
        /* vst1q_p16_x4: binds __p1 to a poly16x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 37.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30938 #define vst1q_p16_x4(__p0, __p1) __extension__ ({ \
  30939   poly16x8x4_t __s1 = __p1; \
  30940   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 37); \
  30941 })
  30942 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  30943 #define vst1q_p16_x4(__p0, __p1) __extension__ ({ \
  30944   poly16x8x4_t __s1 = __p1; \
  30945   poly16x8x4_t __rev1; \
  30946   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  30947   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  30948   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  30949   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  30950   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 37); \
  30951 })
  30952 #endif
  30953 
  30954 #ifdef __LITTLE_ENDIAN__
        /* vst1q_u8_x4: binds __p1 to a uint8x16x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 48.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30955 #define vst1q_u8_x4(__p0, __p1) __extension__ ({ \
  30956   uint8x16x4_t __s1 = __p1; \
  30957   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 48); \
  30958 })
  30959 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  30960 #define vst1q_u8_x4(__p0, __p1) __extension__ ({ \
  30961   uint8x16x4_t __s1 = __p1; \
  30962   uint8x16x4_t __rev1; \
  30963   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30964   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30965   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30966   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  30967   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 48); \
  30968 })
  30969 #endif
  30970 
  30971 #ifdef __LITTLE_ENDIAN__
        /* vst1q_u32_x4: binds __p1 to a uint32x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 50.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30972 #define vst1q_u32_x4(__p0, __p1) __extension__ ({ \
  30973   uint32x4x4_t __s1 = __p1; \
  30974   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 50); \
  30975 })
  30976 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  30977 #define vst1q_u32_x4(__p0, __p1) __extension__ ({ \
  30978   uint32x4x4_t __s1 = __p1; \
  30979   uint32x4x4_t __rev1; \
  30980   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  30981   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  30982   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  30983   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  30984   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 50); \
  30985 })
  30986 #endif
  30987 
  30988 #ifdef __LITTLE_ENDIAN__
        /* vst1q_u64_x4: binds __p1 to a uint64x2x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 51.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  30989 #define vst1q_u64_x4(__p0, __p1) __extension__ ({ \
  30990   uint64x2x4_t __s1 = __p1; \
  30991   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 51); \
  30992 })
  30993 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  30994 #define vst1q_u64_x4(__p0, __p1) __extension__ ({ \
  30995   uint64x2x4_t __s1 = __p1; \
  30996   uint64x2x4_t __rev1; \
  30997   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  30998   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  30999   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31000   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  31001   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 51); \
  31002 })
  31003 #endif
  31004 
  31005 #ifdef __LITTLE_ENDIAN__
        /* vst1q_u16_x4: binds __p1 to a uint16x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 49.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31006 #define vst1q_u16_x4(__p0, __p1) __extension__ ({ \
  31007   uint16x8x4_t __s1 = __p1; \
  31008   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 49); \
  31009 })
  31010 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31011 #define vst1q_u16_x4(__p0, __p1) __extension__ ({ \
  31012   uint16x8x4_t __s1 = __p1; \
  31013   uint16x8x4_t __rev1; \
  31014   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31015   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31016   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31017   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  31018   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 49); \
  31019 })
  31020 #endif
  31021 
  31022 #ifdef __LITTLE_ENDIAN__
        /* vst1q_s8_x4: binds __p1 to an int8x16x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 32.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31023 #define vst1q_s8_x4(__p0, __p1) __extension__ ({ \
  31024   int8x16x4_t __s1 = __p1; \
  31025   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 32); \
  31026 })
  31027 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  31028 #define vst1q_s8_x4(__p0, __p1) __extension__ ({ \
  31029   int8x16x4_t __s1 = __p1; \
  31030   int8x16x4_t __rev1; \
  31031   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31032   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31033   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31034   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31035   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 32); \
  31036 })
  31037 #endif
  31038 
  31039 #ifdef __LITTLE_ENDIAN__
        /* vst1q_f32_x4: binds __p1 to a float32x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 41.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31040 #define vst1q_f32_x4(__p0, __p1) __extension__ ({ \
  31041   float32x4x4_t __s1 = __p1; \
  31042   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 41); \
  31043 })
  31044 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31045 #define vst1q_f32_x4(__p0, __p1) __extension__ ({ \
  31046   float32x4x4_t __s1 = __p1; \
  31047   float32x4x4_t __rev1; \
  31048   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31049   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31050   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31051   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  31052   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 41); \
  31053 })
  31054 #endif
  31055 
  31056 #ifdef __LITTLE_ENDIAN__
        /* vst1q_s32_x4: binds __p1 to an int32x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 34.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31057 #define vst1q_s32_x4(__p0, __p1) __extension__ ({ \
  31058   int32x4x4_t __s1 = __p1; \
  31059   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 34); \
  31060 })
  31061 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31062 #define vst1q_s32_x4(__p0, __p1) __extension__ ({ \
  31063   int32x4x4_t __s1 = __p1; \
  31064   int32x4x4_t __rev1; \
  31065   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31066   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31067   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31068   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  31069   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 34); \
  31070 })
  31071 #endif
  31072 
  31073 #ifdef __LITTLE_ENDIAN__
        /* vst1q_s64_x4: binds __p1 to an int64x2x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 35.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31074 #define vst1q_s64_x4(__p0, __p1) __extension__ ({ \
  31075   int64x2x4_t __s1 = __p1; \
  31076   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 35); \
  31077 })
  31078 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  31079 #define vst1q_s64_x4(__p0, __p1) __extension__ ({ \
  31080   int64x2x4_t __s1 = __p1; \
  31081   int64x2x4_t __rev1; \
  31082   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31083   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31084   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31085   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  31086   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 35); \
  31087 })
  31088 #endif
  31089 
  31090 #ifdef __LITTLE_ENDIAN__
        /* vst1q_s16_x4: binds __p1 to an int16x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x16_t) to __builtin_neon_vst1q_x4_v
         * with trailing constant 33.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31091 #define vst1q_s16_x4(__p0, __p1) __extension__ ({ \
  31092   int16x8x4_t __s1 = __p1; \
  31093   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 33); \
  31094 })
  31095 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31096 #define vst1q_s16_x4(__p0, __p1) __extension__ ({ \
  31097   int16x8x4_t __s1 = __p1; \
  31098   int16x8x4_t __rev1; \
  31099   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31100   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31101   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31102   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  31103   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 33); \
  31104 })
  31105 #endif
  31106 
  31107 #ifdef __LITTLE_ENDIAN__
        /* vst1_u8_x4: binds __p1 to a uint8x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 16.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31108 #define vst1_u8_x4(__p0, __p1) __extension__ ({ \
  31109   uint8x8x4_t __s1 = __p1; \
  31110   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 16); \
  31111 })
  31112 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31113 #define vst1_u8_x4(__p0, __p1) __extension__ ({ \
  31114   uint8x8x4_t __s1 = __p1; \
  31115   uint8x8x4_t __rev1; \
  31116   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31117   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31118   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31119   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  31120   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 16); \
  31121 })
  31122 #endif
  31123 
  31124 #ifdef __LITTLE_ENDIAN__
        /* vst1_u32_x4: binds __p1 to a uint32x2x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 18.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31125 #define vst1_u32_x4(__p0, __p1) __extension__ ({ \
  31126   uint32x2x4_t __s1 = __p1; \
  31127   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 18); \
  31128 })
  31129 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  31130 #define vst1_u32_x4(__p0, __p1) __extension__ ({ \
  31131   uint32x2x4_t __s1 = __p1; \
  31132   uint32x2x4_t __rev1; \
  31133   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31134   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31135   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31136   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  31137   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 18); \
  31138 })
  31139 #endif
  31140 
  /* vst1_u64_x4: binds __p1 to a uint64x1x4_t temporary, then passes __p0 and
   * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
   * with trailing constant 19. Defined once, with no __LITTLE_ENDIAN__ split and
   * no lane reversal (presumably because each vector has one lane -- TODO confirm).
   * NOTE(review): builtin behavior and the constant's meaning are not shown here. */
  31141 #define vst1_u64_x4(__p0, __p1) __extension__ ({ \
  31142   uint64x1x4_t __s1 = __p1; \
  31143   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 19); \
  31144 })
  31145 #ifdef __LITTLE_ENDIAN__
        /* vst1_u16_x4: binds __p1 to a uint16x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 17.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31146 #define vst1_u16_x4(__p0, __p1) __extension__ ({ \
  31147   uint16x4x4_t __s1 = __p1; \
  31148   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 17); \
  31149 })
  31150 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31151 #define vst1_u16_x4(__p0, __p1) __extension__ ({ \
  31152   uint16x4x4_t __s1 = __p1; \
  31153   uint16x4x4_t __rev1; \
  31154   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31155   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31156   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31157   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  31158   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 17); \
  31159 })
  31160 #endif
  31161 
  31162 #ifdef __LITTLE_ENDIAN__
        /* vst1_s8_x4: binds __p1 to an int8x8x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 0.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31163 #define vst1_s8_x4(__p0, __p1) __extension__ ({ \
  31164   int8x8x4_t __s1 = __p1; \
  31165   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 0); \
  31166 })
  31167 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31168 #define vst1_s8_x4(__p0, __p1) __extension__ ({ \
  31169   int8x8x4_t __s1 = __p1; \
  31170   int8x8x4_t __rev1; \
  31171   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31172   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31173   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31174   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  31175   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 0); \
  31176 })
  31177 #endif
  31178 
  31179 #ifdef __LITTLE_ENDIAN__
        /* vst1_f32_x4: binds __p1 to a float32x2x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 9.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31180 #define vst1_f32_x4(__p0, __p1) __extension__ ({ \
  31181   float32x2x4_t __s1 = __p1; \
  31182   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 9); \
  31183 })
  31184 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  31185 #define vst1_f32_x4(__p0, __p1) __extension__ ({ \
  31186   float32x2x4_t __s1 = __p1; \
  31187   float32x2x4_t __rev1; \
  31188   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31189   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31190   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31191   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  31192   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 9); \
  31193 })
  31194 #endif
  31195 
  31196 #ifdef __LITTLE_ENDIAN__
        /* vst1_s32_x4: binds __p1 to an int32x2x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 2.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31197 #define vst1_s32_x4(__p0, __p1) __extension__ ({ \
  31198   int32x2x4_t __s1 = __p1; \
  31199   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 2); \
  31200 })
  31201 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  31202 #define vst1_s32_x4(__p0, __p1) __extension__ ({ \
  31203   int32x2x4_t __s1 = __p1; \
  31204   int32x2x4_t __rev1; \
  31205   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31206   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31207   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31208   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  31209   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 2); \
  31210 })
  31211 #endif
  31212 
  /* vst1_s64_x4: binds __p1 to an int64x1x4_t temporary, then passes __p0 and
   * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
   * with trailing constant 3. Defined once, with no __LITTLE_ENDIAN__ split and
   * no lane reversal (presumably because each vector has one lane -- TODO confirm).
   * NOTE(review): builtin behavior and the constant's meaning are not shown here. */
  31213 #define vst1_s64_x4(__p0, __p1) __extension__ ({ \
  31214   int64x1x4_t __s1 = __p1; \
  31215   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 3); \
  31216 })
  31217 #ifdef __LITTLE_ENDIAN__
        /* vst1_s16_x4: binds __p1 to an int16x4x4_t temporary, then passes __p0 and
         * its four val[] vectors (cast to int8x8_t) to __builtin_neon_vst1_x4_v
         * with trailing constant 1.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31218 #define vst1_s16_x4(__p0, __p1) __extension__ ({ \
  31219   int16x4x4_t __s1 = __p1; \
  31220   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 1); \
  31221 })
  31222 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31223 #define vst1_s16_x4(__p0, __p1) __extension__ ({ \
  31224   int16x4x4_t __s1 = __p1; \
  31225   int16x4x4_t __rev1; \
  31226   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31227   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31228   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31229   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  31230   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 1); \
  31231 })
  31232 #endif
  31233 
  31234 #ifdef __LITTLE_ENDIAN__
        /* vst2_p8: binds __p1 to a poly8x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 4.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31235 #define vst2_p8(__p0, __p1) __extension__ ({ \
  31236   poly8x8x2_t __s1 = __p1; \
  31237   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 4); \
  31238 })
  31239 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31240 #define vst2_p8(__p0, __p1) __extension__ ({ \
  31241   poly8x8x2_t __s1 = __p1; \
  31242   poly8x8x2_t __rev1; \
  31243   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31244   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31245   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 4); \
  31246 })
  31247 #endif
  31248 
  31249 #ifdef __LITTLE_ENDIAN__
        /* vst2_p16: binds __p1 to a poly16x4x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 5.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31250 #define vst2_p16(__p0, __p1) __extension__ ({ \
  31251   poly16x4x2_t __s1 = __p1; \
  31252   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 5); \
  31253 })
  31254 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31255 #define vst2_p16(__p0, __p1) __extension__ ({ \
  31256   poly16x4x2_t __s1 = __p1; \
  31257   poly16x4x2_t __rev1; \
  31258   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31259   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31260   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 5); \
  31261 })
  31262 #endif
  31263 
  31264 #ifdef __LITTLE_ENDIAN__
        /* vst2q_p8: binds __p1 to a poly8x16x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 36.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31265 #define vst2q_p8(__p0, __p1) __extension__ ({ \
  31266   poly8x16x2_t __s1 = __p1; \
  31267   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 36); \
  31268 })
  31269 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  31270 #define vst2q_p8(__p0, __p1) __extension__ ({ \
  31271   poly8x16x2_t __s1 = __p1; \
  31272   poly8x16x2_t __rev1; \
  31273   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31274   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31275   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 36); \
  31276 })
  31277 #endif
  31278 
  31279 #ifdef __LITTLE_ENDIAN__
        /* vst2q_p16: binds __p1 to a poly16x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 37.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31280 #define vst2q_p16(__p0, __p1) __extension__ ({ \
  31281   poly16x8x2_t __s1 = __p1; \
  31282   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 37); \
  31283 })
  31284 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31285 #define vst2q_p16(__p0, __p1) __extension__ ({ \
  31286   poly16x8x2_t __s1 = __p1; \
  31287   poly16x8x2_t __rev1; \
  31288   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31289   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31290   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 37); \
  31291 })
  31292 #endif
  31293 
  31294 #ifdef __LITTLE_ENDIAN__
        /* vst2q_u8: binds __p1 to a uint8x16x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 48.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31295 #define vst2q_u8(__p0, __p1) __extension__ ({ \
  31296   uint8x16x2_t __s1 = __p1; \
  31297   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 48); \
  31298 })
  31299 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  31300 #define vst2q_u8(__p0, __p1) __extension__ ({ \
  31301   uint8x16x2_t __s1 = __p1; \
  31302   uint8x16x2_t __rev1; \
  31303   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31304   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31305   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 48); \
  31306 })
  31307 #endif
  31308 
  31309 #ifdef __LITTLE_ENDIAN__
        /* vst2q_u32: binds __p1 to a uint32x4x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 50.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31310 #define vst2q_u32(__p0, __p1) __extension__ ({ \
  31311   uint32x4x2_t __s1 = __p1; \
  31312   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 50); \
  31313 })
  31314 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31315 #define vst2q_u32(__p0, __p1) __extension__ ({ \
  31316   uint32x4x2_t __s1 = __p1; \
  31317   uint32x4x2_t __rev1; \
  31318   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31319   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31320   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 50); \
  31321 })
  31322 #endif
  31323 
  31324 #ifdef __LITTLE_ENDIAN__
        /* vst2q_u16: binds __p1 to a uint16x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 49.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31325 #define vst2q_u16(__p0, __p1) __extension__ ({ \
  31326   uint16x8x2_t __s1 = __p1; \
  31327   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 49); \
  31328 })
  31329 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31330 #define vst2q_u16(__p0, __p1) __extension__ ({ \
  31331   uint16x8x2_t __s1 = __p1; \
  31332   uint16x8x2_t __rev1; \
  31333   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31334   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31335   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 49); \
  31336 })
  31337 #endif
  31338 
  31339 #ifdef __LITTLE_ENDIAN__
        /* vst2q_s8: binds __p1 to an int8x16x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 32.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31340 #define vst2q_s8(__p0, __p1) __extension__ ({ \
  31341   int8x16x2_t __s1 = __p1; \
  31342   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 32); \
  31343 })
  31344 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 15..0) into __rev1 before the call. */
  31345 #define vst2q_s8(__p0, __p1) __extension__ ({ \
  31346   int8x16x2_t __s1 = __p1; \
  31347   int8x16x2_t __rev1; \
  31348   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31349   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31350   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 32); \
  31351 })
  31352 #endif
  31353 
  31354 #ifdef __LITTLE_ENDIAN__
        /* vst2q_f32: binds __p1 to a float32x4x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 41.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31355 #define vst2q_f32(__p0, __p1) __extension__ ({ \
  31356   float32x4x2_t __s1 = __p1; \
  31357   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 41); \
  31358 })
  31359 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31360 #define vst2q_f32(__p0, __p1) __extension__ ({ \
  31361   float32x4x2_t __s1 = __p1; \
  31362   float32x4x2_t __rev1; \
  31363   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31364   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31365   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 41); \
  31366 })
  31367 #endif
  31368 
  31369 #ifdef __LITTLE_ENDIAN__
        /* vst2q_s32: binds __p1 to an int32x4x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 34.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31370 #define vst2q_s32(__p0, __p1) __extension__ ({ \
  31371   int32x4x2_t __s1 = __p1; \
  31372   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 34); \
  31373 })
  31374 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31375 #define vst2q_s32(__p0, __p1) __extension__ ({ \
  31376   int32x4x2_t __s1 = __p1; \
  31377   int32x4x2_t __rev1; \
  31378   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31379   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31380   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 34); \
  31381 })
  31382 #endif
  31383 
  31384 #ifdef __LITTLE_ENDIAN__
        /* vst2q_s16: binds __p1 to an int16x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x16_t) to __builtin_neon_vst2q_v
         * with trailing constant 33.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31385 #define vst2q_s16(__p0, __p1) __extension__ ({ \
  31386   int16x8x2_t __s1 = __p1; \
  31387   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 33); \
  31388 })
  31389 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31390 #define vst2q_s16(__p0, __p1) __extension__ ({ \
  31391   int16x8x2_t __s1 = __p1; \
  31392   int16x8x2_t __rev1; \
  31393   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31394   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31395   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 33); \
  31396 })
  31397 #endif
  31398 
  31399 #ifdef __LITTLE_ENDIAN__
        /* vst2_u8: binds __p1 to a uint8x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 16.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31400 #define vst2_u8(__p0, __p1) __extension__ ({ \
  31401   uint8x8x2_t __s1 = __p1; \
  31402   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 16); \
  31403 })
  31404 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31405 #define vst2_u8(__p0, __p1) __extension__ ({ \
  31406   uint8x8x2_t __s1 = __p1; \
  31407   uint8x8x2_t __rev1; \
  31408   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31409   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31410   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 16); \
  31411 })
  31412 #endif
  31413 
  31414 #ifdef __LITTLE_ENDIAN__
        /* vst2_u32: binds __p1 to a uint32x2x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 18.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31415 #define vst2_u32(__p0, __p1) __extension__ ({ \
  31416   uint32x2x2_t __s1 = __p1; \
  31417   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 18); \
  31418 })
  31419 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 1, 0) into __rev1 before the call. */
  31420 #define vst2_u32(__p0, __p1) __extension__ ({ \
  31421   uint32x2x2_t __s1 = __p1; \
  31422   uint32x2x2_t __rev1; \
  31423   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31424   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31425   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 18); \
  31426 })
  31427 #endif
  31428 
  /* vst2_u64: binds __p1 to a uint64x1x2_t temporary, then passes __p0 and
   * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
   * with trailing constant 19. Defined once, with no __LITTLE_ENDIAN__ split and
   * no lane reversal (presumably because each vector has one lane -- TODO confirm).
   * NOTE(review): builtin behavior and the constant's meaning are not shown here. */
  31429 #define vst2_u64(__p0, __p1) __extension__ ({ \
  31430   uint64x1x2_t __s1 = __p1; \
  31431   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 19); \
  31432 })
  31433 #ifdef __LITTLE_ENDIAN__
        /* vst2_u16: binds __p1 to a uint16x4x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 17.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31434 #define vst2_u16(__p0, __p1) __extension__ ({ \
  31435   uint16x4x2_t __s1 = __p1; \
  31436   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 17); \
  31437 })
  31438 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 3..0) into __rev1 before the call. */
  31439 #define vst2_u16(__p0, __p1) __extension__ ({ \
  31440   uint16x4x2_t __s1 = __p1; \
  31441   uint16x4x2_t __rev1; \
  31442   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31443   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31444   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 17); \
  31445 })
  31446 #endif
  31447 
  31448 #ifdef __LITTLE_ENDIAN__
        /* vst2_s8: binds __p1 to an int8x8x2_t temporary, then passes __p0 and
         * its two val[] vectors (cast to int8x8_t) to __builtin_neon_vst2_v
         * with trailing constant 0.
         * NOTE(review): the builtin's behavior and the constant's meaning are
         * defined outside this section -- confirm before relying on them. */
  31449 #define vst2_s8(__p0, __p1) __extension__ ({ \
  31450   int8x8x2_t __s1 = __p1; \
  31451   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 0); \
  31452 })
  31453 #else
        /* Used when __LITTLE_ENDIAN__ is undefined: reverses the lane order of
         * each val[] vector (shuffle indices 7..0) into __rev1 before the call. */
  31454 #define vst2_s8(__p0, __p1) __extension__ ({ \
  31455   int8x8x2_t __s1 = __p1; \
  31456   int8x8x2_t __rev1; \
  31457   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31458   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31459   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 0); \
  31460 })
  31461 #endif
  31462 
  31463 #ifdef __LITTLE_ENDIAN__
  31464 #define vst2_f32(__p0, __p1) __extension__ ({ \
  31465   float32x2x2_t __s1 = __p1; \
  31466   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 9); \
  31467 })
  31468 #else
  31469 #define vst2_f32(__p0, __p1) __extension__ ({ \
  31470   float32x2x2_t __s1 = __p1; \
  31471   float32x2x2_t __rev1; \
  31472   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31473   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31474   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 9); \
  31475 })
  31476 #endif
  31477 
  31478 #ifdef __LITTLE_ENDIAN__
  31479 #define vst2_s32(__p0, __p1) __extension__ ({ \
  31480   int32x2x2_t __s1 = __p1; \
  31481   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 2); \
  31482 })
  31483 #else
  31484 #define vst2_s32(__p0, __p1) __extension__ ({ \
  31485   int32x2x2_t __s1 = __p1; \
  31486   int32x2x2_t __rev1; \
  31487   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31488   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31489   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 2); \
  31490 })
  31491 #endif
  31492 
  31493 #define vst2_s64(__p0, __p1) __extension__ ({ \
  31494   int64x1x2_t __s1 = __p1; \
  31495   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 3); \
  31496 })
  31497 #ifdef __LITTLE_ENDIAN__
  31498 #define vst2_s16(__p0, __p1) __extension__ ({ \
  31499   int16x4x2_t __s1 = __p1; \
  31500   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 1); \
  31501 })
  31502 #else
  31503 #define vst2_s16(__p0, __p1) __extension__ ({ \
  31504   int16x4x2_t __s1 = __p1; \
  31505   int16x4x2_t __rev1; \
  31506   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31507   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31508   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 1); \
  31509 })
  31510 #endif
  31511 
  31512 #ifdef __LITTLE_ENDIAN__
  31513 #define vst2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  31514   poly8x8x2_t __s1 = __p1; \
  31515   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 4); \
  31516 })
  31517 #else
  31518 #define vst2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  31519   poly8x8x2_t __s1 = __p1; \
  31520   poly8x8x2_t __rev1; \
  31521   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31522   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31523   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 4); \
  31524 })
  31525 #endif
  31526 
  31527 #ifdef __LITTLE_ENDIAN__
  31528 #define vst2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  31529   poly16x4x2_t __s1 = __p1; \
  31530   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 5); \
  31531 })
  31532 #else
  31533 #define vst2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  31534   poly16x4x2_t __s1 = __p1; \
  31535   poly16x4x2_t __rev1; \
  31536   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31537   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31538   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 5); \
  31539 })
  31540 #endif
  31541 
  31542 #ifdef __LITTLE_ENDIAN__
  31543 #define vst2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  31544   poly16x8x2_t __s1 = __p1; \
  31545   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 37); \
  31546 })
  31547 #else
  31548 #define vst2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  31549   poly16x8x2_t __s1 = __p1; \
  31550   poly16x8x2_t __rev1; \
  31551   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31552   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31553   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 37); \
  31554 })
  31555 #endif
  31556 
  31557 #ifdef __LITTLE_ENDIAN__
  31558 #define vst2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  31559   uint32x4x2_t __s1 = __p1; \
  31560   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 50); \
  31561 })
  31562 #else
  31563 #define vst2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  31564   uint32x4x2_t __s1 = __p1; \
  31565   uint32x4x2_t __rev1; \
  31566   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31567   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31568   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 50); \
  31569 })
  31570 #endif
  31571 
  31572 #ifdef __LITTLE_ENDIAN__
  31573 #define vst2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  31574   uint16x8x2_t __s1 = __p1; \
  31575   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 49); \
  31576 })
  31577 #else
  31578 #define vst2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  31579   uint16x8x2_t __s1 = __p1; \
  31580   uint16x8x2_t __rev1; \
  31581   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31582   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31583   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 49); \
  31584 })
  31585 #endif
  31586 
  31587 #ifdef __LITTLE_ENDIAN__
  31588 #define vst2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  31589   float32x4x2_t __s1 = __p1; \
  31590   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 41); \
  31591 })
  31592 #else
  31593 #define vst2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  31594   float32x4x2_t __s1 = __p1; \
  31595   float32x4x2_t __rev1; \
  31596   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31597   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31598   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 41); \
  31599 })
  31600 #endif
  31601 
  31602 #ifdef __LITTLE_ENDIAN__
  31603 #define vst2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  31604   int32x4x2_t __s1 = __p1; \
  31605   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 34); \
  31606 })
  31607 #else
  31608 #define vst2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  31609   int32x4x2_t __s1 = __p1; \
  31610   int32x4x2_t __rev1; \
  31611   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31612   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31613   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 34); \
  31614 })
  31615 #endif
  31616 
  31617 #ifdef __LITTLE_ENDIAN__
  31618 #define vst2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  31619   int16x8x2_t __s1 = __p1; \
  31620   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 33); \
  31621 })
  31622 #else
  31623 #define vst2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  31624   int16x8x2_t __s1 = __p1; \
  31625   int16x8x2_t __rev1; \
  31626   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31627   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31628   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 33); \
  31629 })
  31630 #endif
  31631 
  31632 #ifdef __LITTLE_ENDIAN__
  31633 #define vst2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  31634   uint8x8x2_t __s1 = __p1; \
  31635   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 16); \
  31636 })
  31637 #else
  31638 #define vst2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  31639   uint8x8x2_t __s1 = __p1; \
  31640   uint8x8x2_t __rev1; \
  31641   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31642   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31643   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 16); \
  31644 })
  31645 #endif
  31646 
  31647 #ifdef __LITTLE_ENDIAN__
  31648 #define vst2_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  31649   uint32x2x2_t __s1 = __p1; \
  31650   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 18); \
  31651 })
  31652 #else
  31653 #define vst2_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  31654   uint32x2x2_t __s1 = __p1; \
  31655   uint32x2x2_t __rev1; \
  31656   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31657   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31658   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 18); \
  31659 })
  31660 #endif
  31661 
  31662 #ifdef __LITTLE_ENDIAN__
  31663 #define vst2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  31664   uint16x4x2_t __s1 = __p1; \
  31665   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 17); \
  31666 })
  31667 #else
  31668 #define vst2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  31669   uint16x4x2_t __s1 = __p1; \
  31670   uint16x4x2_t __rev1; \
  31671   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31672   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31673   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 17); \
  31674 })
  31675 #endif
  31676 
  31677 #ifdef __LITTLE_ENDIAN__
  31678 #define vst2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  31679   int8x8x2_t __s1 = __p1; \
  31680   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 0); \
  31681 })
  31682 #else
  31683 #define vst2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  31684   int8x8x2_t __s1 = __p1; \
  31685   int8x8x2_t __rev1; \
  31686   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31687   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31688   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 0); \
  31689 })
  31690 #endif
  31691 
  31692 #ifdef __LITTLE_ENDIAN__
  31693 #define vst2_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  31694   float32x2x2_t __s1 = __p1; \
  31695   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 9); \
  31696 })
  31697 #else
  31698 #define vst2_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  31699   float32x2x2_t __s1 = __p1; \
  31700   float32x2x2_t __rev1; \
  31701   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31702   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31703   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 9); \
  31704 })
  31705 #endif
  31706 
  31707 #ifdef __LITTLE_ENDIAN__
  31708 #define vst2_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  31709   int32x2x2_t __s1 = __p1; \
  31710   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 2); \
  31711 })
  31712 #else
  31713 #define vst2_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  31714   int32x2x2_t __s1 = __p1; \
  31715   int32x2x2_t __rev1; \
  31716   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31717   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31718   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 2); \
  31719 })
  31720 #endif
  31721 
  31722 #ifdef __LITTLE_ENDIAN__
  31723 #define vst2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  31724   int16x4x2_t __s1 = __p1; \
  31725   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 1); \
  31726 })
  31727 #else
  31728 #define vst2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  31729   int16x4x2_t __s1 = __p1; \
  31730   int16x4x2_t __rev1; \
  31731   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31732   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31733   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 1); \
  31734 })
  31735 #endif
  31736 
  31737 #ifdef __LITTLE_ENDIAN__
  31738 #define vst3_p8(__p0, __p1) __extension__ ({ \
  31739   poly8x8x3_t __s1 = __p1; \
  31740   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 4); \
  31741 })
  31742 #else
  31743 #define vst3_p8(__p0, __p1) __extension__ ({ \
  31744   poly8x8x3_t __s1 = __p1; \
  31745   poly8x8x3_t __rev1; \
  31746   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31747   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31748   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31749   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 4); \
  31750 })
  31751 #endif
  31752 
  31753 #ifdef __LITTLE_ENDIAN__
  31754 #define vst3_p16(__p0, __p1) __extension__ ({ \
  31755   poly16x4x3_t __s1 = __p1; \
  31756   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 5); \
  31757 })
  31758 #else
  31759 #define vst3_p16(__p0, __p1) __extension__ ({ \
  31760   poly16x4x3_t __s1 = __p1; \
  31761   poly16x4x3_t __rev1; \
  31762   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31763   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31764   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31765   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 5); \
  31766 })
  31767 #endif
  31768 
  31769 #ifdef __LITTLE_ENDIAN__
  31770 #define vst3q_p8(__p0, __p1) __extension__ ({ \
  31771   poly8x16x3_t __s1 = __p1; \
  31772   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 36); \
  31773 })
  31774 #else
  31775 #define vst3q_p8(__p0, __p1) __extension__ ({ \
  31776   poly8x16x3_t __s1 = __p1; \
  31777   poly8x16x3_t __rev1; \
  31778   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31779   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31780   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31781   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 36); \
  31782 })
  31783 #endif
  31784 
  31785 #ifdef __LITTLE_ENDIAN__
  31786 #define vst3q_p16(__p0, __p1) __extension__ ({ \
  31787   poly16x8x3_t __s1 = __p1; \
  31788   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 37); \
  31789 })
  31790 #else
  31791 #define vst3q_p16(__p0, __p1) __extension__ ({ \
  31792   poly16x8x3_t __s1 = __p1; \
  31793   poly16x8x3_t __rev1; \
  31794   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31795   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31796   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31797   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 37); \
  31798 })
  31799 #endif
  31800 
  31801 #ifdef __LITTLE_ENDIAN__
  31802 #define vst3q_u8(__p0, __p1) __extension__ ({ \
  31803   uint8x16x3_t __s1 = __p1; \
  31804   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 48); \
  31805 })
  31806 #else
  31807 #define vst3q_u8(__p0, __p1) __extension__ ({ \
  31808   uint8x16x3_t __s1 = __p1; \
  31809   uint8x16x3_t __rev1; \
  31810   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31811   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31812   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31813   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 48); \
  31814 })
  31815 #endif
  31816 
  31817 #ifdef __LITTLE_ENDIAN__
  31818 #define vst3q_u32(__p0, __p1) __extension__ ({ \
  31819   uint32x4x3_t __s1 = __p1; \
  31820   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 50); \
  31821 })
  31822 #else
  31823 #define vst3q_u32(__p0, __p1) __extension__ ({ \
  31824   uint32x4x3_t __s1 = __p1; \
  31825   uint32x4x3_t __rev1; \
  31826   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31827   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31828   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31829   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 50); \
  31830 })
  31831 #endif
  31832 
  31833 #ifdef __LITTLE_ENDIAN__
  31834 #define vst3q_u16(__p0, __p1) __extension__ ({ \
  31835   uint16x8x3_t __s1 = __p1; \
  31836   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 49); \
  31837 })
  31838 #else
  31839 #define vst3q_u16(__p0, __p1) __extension__ ({ \
  31840   uint16x8x3_t __s1 = __p1; \
  31841   uint16x8x3_t __rev1; \
  31842   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31843   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31844   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31845   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 49); \
  31846 })
  31847 #endif
  31848 
  31849 #ifdef __LITTLE_ENDIAN__
  31850 #define vst3q_s8(__p0, __p1) __extension__ ({ \
  31851   int8x16x3_t __s1 = __p1; \
  31852   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 32); \
  31853 })
  31854 #else
  31855 #define vst3q_s8(__p0, __p1) __extension__ ({ \
  31856   int8x16x3_t __s1 = __p1; \
  31857   int8x16x3_t __rev1; \
  31858   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31859   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31860   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  31861   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 32); \
  31862 })
  31863 #endif
  31864 
  31865 #ifdef __LITTLE_ENDIAN__
  31866 #define vst3q_f32(__p0, __p1) __extension__ ({ \
  31867   float32x4x3_t __s1 = __p1; \
  31868   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 41); \
  31869 })
  31870 #else
  31871 #define vst3q_f32(__p0, __p1) __extension__ ({ \
  31872   float32x4x3_t __s1 = __p1; \
  31873   float32x4x3_t __rev1; \
  31874   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31875   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31876   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31877   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 41); \
  31878 })
  31879 #endif
  31880 
  31881 #ifdef __LITTLE_ENDIAN__
  31882 #define vst3q_s32(__p0, __p1) __extension__ ({ \
  31883   int32x4x3_t __s1 = __p1; \
  31884   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 34); \
  31885 })
  31886 #else
  31887 #define vst3q_s32(__p0, __p1) __extension__ ({ \
  31888   int32x4x3_t __s1 = __p1; \
  31889   int32x4x3_t __rev1; \
  31890   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31891   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31892   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31893   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 34); \
  31894 })
  31895 #endif
  31896 
  31897 #ifdef __LITTLE_ENDIAN__
  31898 #define vst3q_s16(__p0, __p1) __extension__ ({ \
  31899   int16x8x3_t __s1 = __p1; \
  31900   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 33); \
  31901 })
  31902 #else
  31903 #define vst3q_s16(__p0, __p1) __extension__ ({ \
  31904   int16x8x3_t __s1 = __p1; \
  31905   int16x8x3_t __rev1; \
  31906   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31907   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31908   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31909   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 33); \
  31910 })
  31911 #endif
  31912 
  31913 #ifdef __LITTLE_ENDIAN__
  31914 #define vst3_u8(__p0, __p1) __extension__ ({ \
  31915   uint8x8x3_t __s1 = __p1; \
  31916   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 16); \
  31917 })
  31918 #else
  31919 #define vst3_u8(__p0, __p1) __extension__ ({ \
  31920   uint8x8x3_t __s1 = __p1; \
  31921   uint8x8x3_t __rev1; \
  31922   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31923   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31924   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31925   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 16); \
  31926 })
  31927 #endif
  31928 
  31929 #ifdef __LITTLE_ENDIAN__
  31930 #define vst3_u32(__p0, __p1) __extension__ ({ \
  31931   uint32x2x3_t __s1 = __p1; \
  31932   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 18); \
  31933 })
  31934 #else
  31935 #define vst3_u32(__p0, __p1) __extension__ ({ \
  31936   uint32x2x3_t __s1 = __p1; \
  31937   uint32x2x3_t __rev1; \
  31938   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31939   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31940   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31941   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 18); \
  31942 })
  31943 #endif
  31944 
  31945 #define vst3_u64(__p0, __p1) __extension__ ({ \
  31946   uint64x1x3_t __s1 = __p1; \
  31947   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 19); \
  31948 })
  31949 #ifdef __LITTLE_ENDIAN__
  31950 #define vst3_u16(__p0, __p1) __extension__ ({ \
  31951   uint16x4x3_t __s1 = __p1; \
  31952   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 17); \
  31953 })
  31954 #else
  31955 #define vst3_u16(__p0, __p1) __extension__ ({ \
  31956   uint16x4x3_t __s1 = __p1; \
  31957   uint16x4x3_t __rev1; \
  31958   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  31959   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  31960   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  31961   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 17); \
  31962 })
  31963 #endif
  31964 
  31965 #ifdef __LITTLE_ENDIAN__
  31966 #define vst3_s8(__p0, __p1) __extension__ ({ \
  31967   int8x8x3_t __s1 = __p1; \
  31968   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 0); \
  31969 })
  31970 #else
  31971 #define vst3_s8(__p0, __p1) __extension__ ({ \
  31972   int8x8x3_t __s1 = __p1; \
  31973   int8x8x3_t __rev1; \
  31974   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  31975   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  31976   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  31977   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 0); \
  31978 })
  31979 #endif
  31980 
  31981 #ifdef __LITTLE_ENDIAN__
  31982 #define vst3_f32(__p0, __p1) __extension__ ({ \
  31983   float32x2x3_t __s1 = __p1; \
  31984   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 9); \
  31985 })
  31986 #else
  31987 #define vst3_f32(__p0, __p1) __extension__ ({ \
  31988   float32x2x3_t __s1 = __p1; \
  31989   float32x2x3_t __rev1; \
  31990   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  31991   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  31992   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  31993   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 9); \
  31994 })
  31995 #endif
  31996 
  31997 #ifdef __LITTLE_ENDIAN__
  31998 #define vst3_s32(__p0, __p1) __extension__ ({ \
  31999   int32x2x3_t __s1 = __p1; \
  32000   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 2); \
  32001 })
  32002 #else
  32003 #define vst3_s32(__p0, __p1) __extension__ ({ \
  32004   int32x2x3_t __s1 = __p1; \
  32005   int32x2x3_t __rev1; \
  32006   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32007   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32008   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32009   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 2); \
  32010 })
  32011 #endif
  32012 
  32013 #define vst3_s64(__p0, __p1) __extension__ ({ \
  32014   int64x1x3_t __s1 = __p1; \
  32015   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 3); \
  32016 })
  32017 #ifdef __LITTLE_ENDIAN__
  32018 #define vst3_s16(__p0, __p1) __extension__ ({ \
  32019   int16x4x3_t __s1 = __p1; \
  32020   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 1); \
  32021 })
  32022 #else
  32023 #define vst3_s16(__p0, __p1) __extension__ ({ \
  32024   int16x4x3_t __s1 = __p1; \
  32025   int16x4x3_t __rev1; \
  32026   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32027   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32028   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32029   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 1); \
  32030 })
  32031 #endif
  32032 
  32033 #ifdef __LITTLE_ENDIAN__
  32034 #define vst3_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  32035   poly8x8x3_t __s1 = __p1; \
  32036   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 4); \
  32037 })
  32038 #else
  32039 #define vst3_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  32040   poly8x8x3_t __s1 = __p1; \
  32041   poly8x8x3_t __rev1; \
  32042   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32043   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32044   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32045   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 4); \
  32046 })
  32047 #endif
  32048 
  32049 #ifdef __LITTLE_ENDIAN__
  32050 #define vst3_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32051   poly16x4x3_t __s1 = __p1; \
  32052   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 5); \
  32053 })
  32054 #else
  32055 #define vst3_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32056   poly16x4x3_t __s1 = __p1; \
  32057   poly16x4x3_t __rev1; \
  32058   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32059   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32060   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32061   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 5); \
  32062 })
  32063 #endif
  32064 
  /* vst3q_lane_p16: takes a by-value copy of __p1 (poly16x8x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 37. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 37 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32065 #ifdef __LITTLE_ENDIAN__
  32066 #define vst3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32067   poly16x8x3_t __s1 = __p1; \
  32068   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 37); \
  32069 })
  32070 #else
  32071 #define vst3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32072   poly16x8x3_t __s1 = __p1; \
  32073   poly16x8x3_t __rev1; \
  32074   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32075   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32076   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32077   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 37); \
  32078 })
  32079 #endif
  32080 
  /* vst3q_lane_u32: takes a by-value copy of __p1 (uint32x4x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 50. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 50 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32081 #ifdef __LITTLE_ENDIAN__
  32082 #define vst3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32083   uint32x4x3_t __s1 = __p1; \
  32084   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 50); \
  32085 })
  32086 #else
  32087 #define vst3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32088   uint32x4x3_t __s1 = __p1; \
  32089   uint32x4x3_t __rev1; \
  32090   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32091   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32092   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32093   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 50); \
  32094 })
  32095 #endif
  32096 
  /* vst3q_lane_u16: takes a by-value copy of __p1 (uint16x8x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 49. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 49 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32097 #ifdef __LITTLE_ENDIAN__
  32098 #define vst3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32099   uint16x8x3_t __s1 = __p1; \
  32100   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 49); \
  32101 })
  32102 #else
  32103 #define vst3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32104   uint16x8x3_t __s1 = __p1; \
  32105   uint16x8x3_t __rev1; \
  32106   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32107   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32108   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32109   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 49); \
  32110 })
  32111 #endif
  32112 
  /* vst3q_lane_f32: takes a by-value copy of __p1 (float32x4x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 41. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 41 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32113 #ifdef __LITTLE_ENDIAN__
  32114 #define vst3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32115   float32x4x3_t __s1 = __p1; \
  32116   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 41); \
  32117 })
  32118 #else
  32119 #define vst3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32120   float32x4x3_t __s1 = __p1; \
  32121   float32x4x3_t __rev1; \
  32122   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32123   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32124   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32125   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 41); \
  32126 })
  32127 #endif
  32128 
  /* vst3q_lane_s32: takes a by-value copy of __p1 (int32x4x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 34. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 34 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32129 #ifdef __LITTLE_ENDIAN__
  32130 #define vst3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32131   int32x4x3_t __s1 = __p1; \
  32132   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 34); \
  32133 })
  32134 #else
  32135 #define vst3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32136   int32x4x3_t __s1 = __p1; \
  32137   int32x4x3_t __rev1; \
  32138   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32139   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32140   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32141   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 34); \
  32142 })
  32143 #endif
  32144 
  /* vst3q_lane_s16: takes a by-value copy of __p1 (int16x8x3_t) and passes its
   * three vectors, cast to int8x16_t, to __builtin_neon_vst3q_lane_v along with
   * __p0, __p2 and the constant 33. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 33 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32145 #ifdef __LITTLE_ENDIAN__
  32146 #define vst3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32147   int16x8x3_t __s1 = __p1; \
  32148   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 33); \
  32149 })
  32150 #else
  32151 #define vst3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32152   int16x8x3_t __s1 = __p1; \
  32153   int16x8x3_t __rev1; \
  32154   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32155   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32156   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32157   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 33); \
  32158 })
  32159 #endif
  32160 
  /* vst3_lane_u8: takes a by-value copy of __p1 (uint8x8x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 16. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 16 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32161 #ifdef __LITTLE_ENDIAN__
  32162 #define vst3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  32163   uint8x8x3_t __s1 = __p1; \
  32164   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 16); \
  32165 })
  32166 #else
  32167 #define vst3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  32168   uint8x8x3_t __s1 = __p1; \
  32169   uint8x8x3_t __rev1; \
  32170   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32171   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32172   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32173   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 16); \
  32174 })
  32175 #endif
  32176 
  /* vst3_lane_u32: takes a by-value copy of __p1 (uint32x2x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 18. When __LITTLE_ENDIAN__ is not defined, the
   * two lanes of each vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 18 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32177 #ifdef __LITTLE_ENDIAN__
  32178 #define vst3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32179   uint32x2x3_t __s1 = __p1; \
  32180   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 18); \
  32181 })
  32182 #else
  32183 #define vst3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32184   uint32x2x3_t __s1 = __p1; \
  32185   uint32x2x3_t __rev1; \
  32186   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32187   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32188   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32189   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 18); \
  32190 })
  32191 #endif
  32192 
  /* vst3_lane_u16: takes a by-value copy of __p1 (uint16x4x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 17. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 17 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32193 #ifdef __LITTLE_ENDIAN__
  32194 #define vst3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32195   uint16x4x3_t __s1 = __p1; \
  32196   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 17); \
  32197 })
  32198 #else
  32199 #define vst3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32200   uint16x4x3_t __s1 = __p1; \
  32201   uint16x4x3_t __rev1; \
  32202   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32203   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32204   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32205   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 17); \
  32206 })
  32207 #endif
  32208 
  /* vst3_lane_s8: takes a by-value copy of __p1 (int8x8x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 0. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 0 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32209 #ifdef __LITTLE_ENDIAN__
  32210 #define vst3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  32211   int8x8x3_t __s1 = __p1; \
  32212   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 0); \
  32213 })
  32214 #else
  32215 #define vst3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  32216   int8x8x3_t __s1 = __p1; \
  32217   int8x8x3_t __rev1; \
  32218   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32219   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32220   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32221   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 0); \
  32222 })
  32223 #endif
  32224 
  /* vst3_lane_f32: takes a by-value copy of __p1 (float32x2x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 9. When __LITTLE_ENDIAN__ is not defined, the
   * two lanes of each vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 9 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32225 #ifdef __LITTLE_ENDIAN__
  32226 #define vst3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32227   float32x2x3_t __s1 = __p1; \
  32228   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 9); \
  32229 })
  32230 #else
  32231 #define vst3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32232   float32x2x3_t __s1 = __p1; \
  32233   float32x2x3_t __rev1; \
  32234   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32235   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32236   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32237   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 9); \
  32238 })
  32239 #endif
  32240 
  /* vst3_lane_s32: takes a by-value copy of __p1 (int32x2x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 2. When __LITTLE_ENDIAN__ is not defined, the
   * two lanes of each vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 2 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32241 #ifdef __LITTLE_ENDIAN__
  32242 #define vst3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32243   int32x2x3_t __s1 = __p1; \
  32244   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 2); \
  32245 })
  32246 #else
  32247 #define vst3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32248   int32x2x3_t __s1 = __p1; \
  32249   int32x2x3_t __rev1; \
  32250   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32251   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32252   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32253   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 2); \
  32254 })
  32255 #endif
  32256 
  /* vst3_lane_s16: takes a by-value copy of __p1 (int16x4x3_t) and passes its
   * three vectors, cast to int8x8_t, to __builtin_neon_vst3_lane_v along with
   * __p0, __p2 and the constant 1. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 1 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32257 #ifdef __LITTLE_ENDIAN__
  32258 #define vst3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32259   int16x4x3_t __s1 = __p1; \
  32260   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 1); \
  32261 })
  32262 #else
  32263 #define vst3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32264   int16x4x3_t __s1 = __p1; \
  32265   int16x4x3_t __rev1; \
  32266   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32267   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32268   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32269   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 1); \
  32270 })
  32271 #endif
  32272 
  /* vst4_p8: takes a by-value copy of __p1 (poly8x8x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 4. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 4 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32273 #ifdef __LITTLE_ENDIAN__
  32274 #define vst4_p8(__p0, __p1) __extension__ ({ \
  32275   poly8x8x4_t __s1 = __p1; \
  32276   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 4); \
  32277 })
  32278 #else
  32279 #define vst4_p8(__p0, __p1) __extension__ ({ \
  32280   poly8x8x4_t __s1 = __p1; \
  32281   poly8x8x4_t __rev1; \
  32282   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32283   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32284   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32285   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32286   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 4); \
  32287 })
  32288 #endif
  32289 
  /* vst4_p16: takes a by-value copy of __p1 (poly16x4x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 5. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 5 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32290 #ifdef __LITTLE_ENDIAN__
  32291 #define vst4_p16(__p0, __p1) __extension__ ({ \
  32292   poly16x4x4_t __s1 = __p1; \
  32293   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 5); \
  32294 })
  32295 #else
  32296 #define vst4_p16(__p0, __p1) __extension__ ({ \
  32297   poly16x4x4_t __s1 = __p1; \
  32298   poly16x4x4_t __rev1; \
  32299   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32300   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32301   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32302   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32303   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 5); \
  32304 })
  32305 #endif
  32306 
  /* vst4q_p8: takes a by-value copy of __p1 (poly8x16x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 36. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 15 down to 0).
   * NOTE(review): 36 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32307 #ifdef __LITTLE_ENDIAN__
  32308 #define vst4q_p8(__p0, __p1) __extension__ ({ \
  32309   poly8x16x4_t __s1 = __p1; \
  32310   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 36); \
  32311 })
  32312 #else
  32313 #define vst4q_p8(__p0, __p1) __extension__ ({ \
  32314   poly8x16x4_t __s1 = __p1; \
  32315   poly8x16x4_t __rev1; \
  32316   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32317   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32318   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32319   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32320   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 36); \
  32321 })
  32322 #endif
  32323 
  /* vst4q_p16: takes a by-value copy of __p1 (poly16x8x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 37. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 37 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32324 #ifdef __LITTLE_ENDIAN__
  32325 #define vst4q_p16(__p0, __p1) __extension__ ({ \
  32326   poly16x8x4_t __s1 = __p1; \
  32327   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 37); \
  32328 })
  32329 #else
  32330 #define vst4q_p16(__p0, __p1) __extension__ ({ \
  32331   poly16x8x4_t __s1 = __p1; \
  32332   poly16x8x4_t __rev1; \
  32333   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32334   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32335   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32336   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32337   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 37); \
  32338 })
  32339 #endif
  32340 
  /* vst4q_u8: takes a by-value copy of __p1 (uint8x16x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 48. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 15 down to 0).
   * NOTE(review): 48 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32341 #ifdef __LITTLE_ENDIAN__
  32342 #define vst4q_u8(__p0, __p1) __extension__ ({ \
  32343   uint8x16x4_t __s1 = __p1; \
  32344   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 48); \
  32345 })
  32346 #else
  32347 #define vst4q_u8(__p0, __p1) __extension__ ({ \
  32348   uint8x16x4_t __s1 = __p1; \
  32349   uint8x16x4_t __rev1; \
  32350   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32351   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32352   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32353   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32354   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 48); \
  32355 })
  32356 #endif
  32357 
  /* vst4q_u32: takes a by-value copy of __p1 (uint32x4x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 50. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 50 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32358 #ifdef __LITTLE_ENDIAN__
  32359 #define vst4q_u32(__p0, __p1) __extension__ ({ \
  32360   uint32x4x4_t __s1 = __p1; \
  32361   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 50); \
  32362 })
  32363 #else
  32364 #define vst4q_u32(__p0, __p1) __extension__ ({ \
  32365   uint32x4x4_t __s1 = __p1; \
  32366   uint32x4x4_t __rev1; \
  32367   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32368   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32369   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32370   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32371   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 50); \
  32372 })
  32373 #endif
  32374 
  /* vst4q_u16: takes a by-value copy of __p1 (uint16x8x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 49. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 49 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32375 #ifdef __LITTLE_ENDIAN__
  32376 #define vst4q_u16(__p0, __p1) __extension__ ({ \
  32377   uint16x8x4_t __s1 = __p1; \
  32378   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 49); \
  32379 })
  32380 #else
  32381 #define vst4q_u16(__p0, __p1) __extension__ ({ \
  32382   uint16x8x4_t __s1 = __p1; \
  32383   uint16x8x4_t __rev1; \
  32384   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32385   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32386   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32387   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32388   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 49); \
  32389 })
  32390 #endif
  32391 
  /* vst4q_s8: takes a by-value copy of __p1 (int8x16x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 32. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 15 down to 0).
   * NOTE(review): 32 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32392 #ifdef __LITTLE_ENDIAN__
  32393 #define vst4q_s8(__p0, __p1) __extension__ ({ \
  32394   int8x16x4_t __s1 = __p1; \
  32395   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 32); \
  32396 })
  32397 #else
  32398 #define vst4q_s8(__p0, __p1) __extension__ ({ \
  32399   int8x16x4_t __s1 = __p1; \
  32400   int8x16x4_t __rev1; \
  32401   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32402   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32403   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32404   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  32405   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 32); \
  32406 })
  32407 #endif
  32408 
  /* vst4q_f32: takes a by-value copy of __p1 (float32x4x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 41. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 41 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32409 #ifdef __LITTLE_ENDIAN__
  32410 #define vst4q_f32(__p0, __p1) __extension__ ({ \
  32411   float32x4x4_t __s1 = __p1; \
  32412   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 41); \
  32413 })
  32414 #else
  32415 #define vst4q_f32(__p0, __p1) __extension__ ({ \
  32416   float32x4x4_t __s1 = __p1; \
  32417   float32x4x4_t __rev1; \
  32418   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32419   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32420   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32421   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32422   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 41); \
  32423 })
  32424 #endif
  32425 
  /* vst4q_s32: takes a by-value copy of __p1 (int32x4x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 34. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 34 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32426 #ifdef __LITTLE_ENDIAN__
  32427 #define vst4q_s32(__p0, __p1) __extension__ ({ \
  32428   int32x4x4_t __s1 = __p1; \
  32429   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 34); \
  32430 })
  32431 #else
  32432 #define vst4q_s32(__p0, __p1) __extension__ ({ \
  32433   int32x4x4_t __s1 = __p1; \
  32434   int32x4x4_t __rev1; \
  32435   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32436   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32437   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32438   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32439   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 34); \
  32440 })
  32441 #endif
  32442 
  /* vst4q_s16: takes a by-value copy of __p1 (int16x8x4_t) and passes its four
   * vectors, cast to int8x16_t, to __builtin_neon_vst4q_v along with __p0 and
   * the constant 33. When __LITTLE_ENDIAN__ is not defined, each vector's lanes
   * are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 33 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32443 #ifdef __LITTLE_ENDIAN__
  32444 #define vst4q_s16(__p0, __p1) __extension__ ({ \
  32445   int16x8x4_t __s1 = __p1; \
  32446   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 33); \
  32447 })
  32448 #else
  32449 #define vst4q_s16(__p0, __p1) __extension__ ({ \
  32450   int16x8x4_t __s1 = __p1; \
  32451   int16x8x4_t __rev1; \
  32452   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32453   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32454   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32455   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32456   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 33); \
  32457 })
  32458 #endif
  32459 
  /* vst4_u8: takes a by-value copy of __p1 (uint8x8x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 16. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 16 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32460 #ifdef __LITTLE_ENDIAN__
  32461 #define vst4_u8(__p0, __p1) __extension__ ({ \
  32462   uint8x8x4_t __s1 = __p1; \
  32463   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 16); \
  32464 })
  32465 #else
  32466 #define vst4_u8(__p0, __p1) __extension__ ({ \
  32467   uint8x8x4_t __s1 = __p1; \
  32468   uint8x8x4_t __rev1; \
  32469   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32470   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32471   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32472   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32473   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 16); \
  32474 })
  32475 #endif
  32476 
  /* vst4_u32: takes a by-value copy of __p1 (uint32x2x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 18. When __LITTLE_ENDIAN__ is not defined, the two lanes of each
   * vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 18 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32477 #ifdef __LITTLE_ENDIAN__
  32478 #define vst4_u32(__p0, __p1) __extension__ ({ \
  32479   uint32x2x4_t __s1 = __p1; \
  32480   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 18); \
  32481 })
  32482 #else
  32483 #define vst4_u32(__p0, __p1) __extension__ ({ \
  32484   uint32x2x4_t __s1 = __p1; \
  32485   uint32x2x4_t __rev1; \
  32486   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32487   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32488   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32489   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32490   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 18); \
  32491 })
  32492 #endif
  32493 
  /* vst4_u64: takes a by-value copy of __p1 (uint64x1x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 19. Unlike the neighbouring macros, this one has a single
   * definition with no __LITTLE_ENDIAN__ split and no lane shuffle.
   * NOTE(review): 19 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32494 #define vst4_u64(__p0, __p1) __extension__ ({ \
  32495   uint64x1x4_t __s1 = __p1; \
  32496   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 19); \
  32497 })
  /* vst4_u16: takes a by-value copy of __p1 (uint16x4x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 17. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 17 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32498 #ifdef __LITTLE_ENDIAN__
  32499 #define vst4_u16(__p0, __p1) __extension__ ({ \
  32500   uint16x4x4_t __s1 = __p1; \
  32501   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 17); \
  32502 })
  32503 #else
  32504 #define vst4_u16(__p0, __p1) __extension__ ({ \
  32505   uint16x4x4_t __s1 = __p1; \
  32506   uint16x4x4_t __rev1; \
  32507   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32508   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32509   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32510   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32511   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 17); \
  32512 })
  32513 #endif
  32514 
  /* vst4_s8: takes a by-value copy of __p1 (int8x8x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 0. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 0 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32515 #ifdef __LITTLE_ENDIAN__
  32516 #define vst4_s8(__p0, __p1) __extension__ ({ \
  32517   int8x8x4_t __s1 = __p1; \
  32518   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 0); \
  32519 })
  32520 #else
  32521 #define vst4_s8(__p0, __p1) __extension__ ({ \
  32522   int8x8x4_t __s1 = __p1; \
  32523   int8x8x4_t __rev1; \
  32524   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32525   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32526   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32527   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32528   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 0); \
  32529 })
  32530 #endif
  32531 
  /* vst4_f32: takes a by-value copy of __p1 (float32x2x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 9. When __LITTLE_ENDIAN__ is not defined, the two lanes of each
   * vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 9 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32532 #ifdef __LITTLE_ENDIAN__
  32533 #define vst4_f32(__p0, __p1) __extension__ ({ \
  32534   float32x2x4_t __s1 = __p1; \
  32535   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 9); \
  32536 })
  32537 #else
  32538 #define vst4_f32(__p0, __p1) __extension__ ({ \
  32539   float32x2x4_t __s1 = __p1; \
  32540   float32x2x4_t __rev1; \
  32541   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32542   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32543   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32544   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32545   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 9); \
  32546 })
  32547 #endif
  32548 
  /* vst4_s32: takes a by-value copy of __p1 (int32x2x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 2. When __LITTLE_ENDIAN__ is not defined, the two lanes of each
   * vector are first swapped (shuffle indices 1, 0).
   * NOTE(review): 2 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32549 #ifdef __LITTLE_ENDIAN__
  32550 #define vst4_s32(__p0, __p1) __extension__ ({ \
  32551   int32x2x4_t __s1 = __p1; \
  32552   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 2); \
  32553 })
  32554 #else
  32555 #define vst4_s32(__p0, __p1) __extension__ ({ \
  32556   int32x2x4_t __s1 = __p1; \
  32557   int32x2x4_t __rev1; \
  32558   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32559   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32560   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32561   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32562   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 2); \
  32563 })
  32564 #endif
  32565 
  /* vst4_s64: takes a by-value copy of __p1 (int64x1x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 3. Unlike the neighbouring macros, this one has a single
   * definition with no __LITTLE_ENDIAN__ split and no lane shuffle.
   * NOTE(review): 3 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32566 #define vst4_s64(__p0, __p1) __extension__ ({ \
  32567   int64x1x4_t __s1 = __p1; \
  32568   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 3); \
  32569 })
  /* vst4_s16: takes a by-value copy of __p1 (int16x4x4_t) and passes its four
   * vectors, cast to int8x8_t, to __builtin_neon_vst4_v along with __p0 and the
   * constant 1. When __LITTLE_ENDIAN__ is not defined, each vector's lanes are
   * first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 1 is presumably the builtin's element-type code and __p0 the
   * store address -- confirm against the ACLE docs. */
  32570 #ifdef __LITTLE_ENDIAN__
  32571 #define vst4_s16(__p0, __p1) __extension__ ({ \
  32572   int16x4x4_t __s1 = __p1; \
  32573   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 1); \
  32574 })
  32575 #else
  32576 #define vst4_s16(__p0, __p1) __extension__ ({ \
  32577   int16x4x4_t __s1 = __p1; \
  32578   int16x4x4_t __rev1; \
  32579   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32580   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32581   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32582   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32583   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 1); \
  32584 })
  32585 #endif
  32586 
  /* vst4_lane_p8: takes a by-value copy of __p1 (poly8x8x4_t) and passes its
   * four vectors, cast to int8x8_t, to __builtin_neon_vst4_lane_v along with
   * __p0, __p2 and the constant 4. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 4 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32587 #ifdef __LITTLE_ENDIAN__
  32588 #define vst4_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  32589   poly8x8x4_t __s1 = __p1; \
  32590   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 4); \
  32591 })
  32592 #else
  32593 #define vst4_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  32594   poly8x8x4_t __s1 = __p1; \
  32595   poly8x8x4_t __rev1; \
  32596   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32597   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32598   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32599   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32600   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 4); \
  32601 })
  32602 #endif
  32603 
  /* vst4_lane_p16: takes a by-value copy of __p1 (poly16x4x4_t) and passes its
   * four vectors, cast to int8x8_t, to __builtin_neon_vst4_lane_v along with
   * __p0, __p2 and the constant 5. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 3, 2, 1, 0).
   * NOTE(review): 5 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32604 #ifdef __LITTLE_ENDIAN__
  32605 #define vst4_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32606   poly16x4x4_t __s1 = __p1; \
  32607   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 5); \
  32608 })
  32609 #else
  32610 #define vst4_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32611   poly16x4x4_t __s1 = __p1; \
  32612   poly16x4x4_t __rev1; \
  32613   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32614   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32615   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32616   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32617   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 5); \
  32618 })
  32619 #endif
  32620 
  /* vst4q_lane_p16: takes a by-value copy of __p1 (poly16x8x4_t) and passes its
   * four vectors, cast to int8x16_t, to __builtin_neon_vst4q_lane_v along with
   * __p0, __p2 and the constant 37. When __LITTLE_ENDIAN__ is not defined, each
   * vector's lanes are first reversed (shuffle indices 7 down to 0).
   * NOTE(review): 37 is presumably the builtin's element-type code, __p0 the
   * store address and __p2 the lane index -- confirm against the ACLE docs. */
  32621 #ifdef __LITTLE_ENDIAN__
  32622 #define vst4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32623   poly16x8x4_t __s1 = __p1; \
  32624   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 37); \
  32625 })
  32626 #else
  32627 #define vst4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  32628   poly16x8x4_t __s1 = __p1; \
  32629   poly16x8x4_t __rev1; \
  32630   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32631   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32632   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32633   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32634   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 37); \
  32635 })
  32636 #endif
  32637 
  32638 #ifdef __LITTLE_ENDIAN__
  32639 #define vst4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32640   uint32x4x4_t __s1 = __p1; \
  32641   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 50); \
  32642 })
  32643 #else
  32644 #define vst4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32645   uint32x4x4_t __s1 = __p1; \
  32646   uint32x4x4_t __rev1; \
  32647   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32648   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32649   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32650   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32651   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 50); \
  32652 })
  32653 #endif
  32654 
  32655 #ifdef __LITTLE_ENDIAN__
  32656 #define vst4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32657   uint16x8x4_t __s1 = __p1; \
  32658   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 49); \
  32659 })
  32660 #else
  32661 #define vst4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32662   uint16x8x4_t __s1 = __p1; \
  32663   uint16x8x4_t __rev1; \
  32664   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32665   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32666   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32667   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32668   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 49); \
  32669 })
  32670 #endif
  32671 
  32672 #ifdef __LITTLE_ENDIAN__
  32673 #define vst4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32674   float32x4x4_t __s1 = __p1; \
  32675   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 41); \
  32676 })
  32677 #else
  32678 #define vst4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32679   float32x4x4_t __s1 = __p1; \
  32680   float32x4x4_t __rev1; \
  32681   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32682   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32683   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32684   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32685   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 41); \
  32686 })
  32687 #endif
  32688 
  32689 #ifdef __LITTLE_ENDIAN__
  32690 #define vst4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32691   int32x4x4_t __s1 = __p1; \
  32692   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 34); \
  32693 })
  32694 #else
  32695 #define vst4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32696   int32x4x4_t __s1 = __p1; \
  32697   int32x4x4_t __rev1; \
  32698   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32699   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32700   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32701   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32702   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 34); \
  32703 })
  32704 #endif
  32705 
  32706 #ifdef __LITTLE_ENDIAN__
  32707 #define vst4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32708   int16x8x4_t __s1 = __p1; \
  32709   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 33); \
  32710 })
  32711 #else
  32712 #define vst4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32713   int16x8x4_t __s1 = __p1; \
  32714   int16x8x4_t __rev1; \
  32715   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32716   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32717   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32718   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32719   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 33); \
  32720 })
  32721 #endif
  32722 
  32723 #ifdef __LITTLE_ENDIAN__
  32724 #define vst4_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  32725   uint8x8x4_t __s1 = __p1; \
  32726   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 16); \
  32727 })
  32728 #else
  32729 #define vst4_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  32730   uint8x8x4_t __s1 = __p1; \
  32731   uint8x8x4_t __rev1; \
  32732   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32733   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32734   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32735   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32736   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 16); \
  32737 })
  32738 #endif
  32739 
  32740 #ifdef __LITTLE_ENDIAN__
  32741 #define vst4_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32742   uint32x2x4_t __s1 = __p1; \
  32743   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 18); \
  32744 })
  32745 #else
  32746 #define vst4_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  32747   uint32x2x4_t __s1 = __p1; \
  32748   uint32x2x4_t __rev1; \
  32749   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32750   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32751   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32752   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32753   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 18); \
  32754 })
  32755 #endif
  32756 
  32757 #ifdef __LITTLE_ENDIAN__
  32758 #define vst4_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32759   uint16x4x4_t __s1 = __p1; \
  32760   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 17); \
  32761 })
  32762 #else
  32763 #define vst4_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  32764   uint16x4x4_t __s1 = __p1; \
  32765   uint16x4x4_t __rev1; \
  32766   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32767   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32768   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32769   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32770   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 17); \
  32771 })
  32772 #endif
  32773 
  32774 #ifdef __LITTLE_ENDIAN__
  32775 #define vst4_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  32776   int8x8x4_t __s1 = __p1; \
  32777   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 0); \
  32778 })
  32779 #else
  32780 #define vst4_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  32781   int8x8x4_t __s1 = __p1; \
  32782   int8x8x4_t __rev1; \
  32783   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  32784   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  32785   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  32786   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  32787   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 0); \
  32788 })
  32789 #endif
  32790 
  32791 #ifdef __LITTLE_ENDIAN__
  32792 #define vst4_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32793   float32x2x4_t __s1 = __p1; \
  32794   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 9); \
  32795 })
  32796 #else
  32797 #define vst4_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  32798   float32x2x4_t __s1 = __p1; \
  32799   float32x2x4_t __rev1; \
  32800   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32801   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32802   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32803   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32804   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 9); \
  32805 })
  32806 #endif
  32807 
  32808 #ifdef __LITTLE_ENDIAN__
  32809 #define vst4_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32810   int32x2x4_t __s1 = __p1; \
  32811   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 2); \
  32812 })
  32813 #else
  32814 #define vst4_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  32815   int32x2x4_t __s1 = __p1; \
  32816   int32x2x4_t __rev1; \
  32817   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  32818   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  32819   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  32820   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  32821   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 2); \
  32822 })
  32823 #endif
  32824 
  32825 #ifdef __LITTLE_ENDIAN__
  32826 #define vst4_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32827   int16x4x4_t __s1 = __p1; \
  32828   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 1); \
  32829 })
  32830 #else
  32831 #define vst4_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  32832   int16x4x4_t __s1 = __p1; \
  32833   int16x4x4_t __rev1; \
  32834   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  32835   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  32836   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  32837   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  32838   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 1); \
  32839 })
  32840 #endif
  32841 
  32842 #ifdef __LITTLE_ENDIAN__
  32843 __ai __attribute__((target("neon"))) uint8x16_t vsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  32844   uint8x16_t __ret;
  32845   __ret = __p0 - __p1;
  32846   return __ret;
  32847 }
  32848 #else
  32849 __ai __attribute__((target("neon"))) uint8x16_t vsubq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  32850   uint8x16_t __ret;
  32851   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32852   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32853   __ret = __rev0 - __rev1;
  32854   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32855   return __ret;
  32856 }
  32857 #endif
  32858 
  32859 #ifdef __LITTLE_ENDIAN__
  32860 __ai __attribute__((target("neon"))) uint32x4_t vsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  32861   uint32x4_t __ret;
  32862   __ret = __p0 - __p1;
  32863   return __ret;
  32864 }
  32865 #else
  32866 __ai __attribute__((target("neon"))) uint32x4_t vsubq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  32867   uint32x4_t __ret;
  32868   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  32869   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  32870   __ret = __rev0 - __rev1;
  32871   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  32872   return __ret;
  32873 }
  32874 #endif
  32875 
  32876 #ifdef __LITTLE_ENDIAN__
  32877 __ai __attribute__((target("neon"))) uint64x2_t vsubq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  32878   uint64x2_t __ret;
  32879   __ret = __p0 - __p1;
  32880   return __ret;
  32881 }
  32882 #else
  32883 __ai __attribute__((target("neon"))) uint64x2_t vsubq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  32884   uint64x2_t __ret;
  32885   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  32886   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  32887   __ret = __rev0 - __rev1;
  32888   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  32889   return __ret;
  32890 }
  32891 #endif
  32892 
  32893 #ifdef __LITTLE_ENDIAN__
  32894 __ai __attribute__((target("neon"))) uint16x8_t vsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  32895   uint16x8_t __ret;
  32896   __ret = __p0 - __p1;
  32897   return __ret;
  32898 }
  32899 #else
  32900 __ai __attribute__((target("neon"))) uint16x8_t vsubq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  32901   uint16x8_t __ret;
  32902   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  32903   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  32904   __ret = __rev0 - __rev1;
  32905   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  32906   return __ret;
  32907 }
  32908 #endif
  32909 
  32910 #ifdef __LITTLE_ENDIAN__
  32911 __ai __attribute__((target("neon"))) int8x16_t vsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  32912   int8x16_t __ret;
  32913   __ret = __p0 - __p1;
  32914   return __ret;
  32915 }
  32916 #else
  32917 __ai __attribute__((target("neon"))) int8x16_t vsubq_s8(int8x16_t __p0, int8x16_t __p1) {
  32918   int8x16_t __ret;
  32919   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32920   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32921   __ret = __rev0 - __rev1;
  32922   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  32923   return __ret;
  32924 }
  32925 #endif
  32926 
  32927 #ifdef __LITTLE_ENDIAN__
  32928 __ai __attribute__((target("neon"))) float32x4_t vsubq_f32(float32x4_t __p0, float32x4_t __p1) {
  32929   float32x4_t __ret;
  32930   __ret = __p0 - __p1;
  32931   return __ret;
  32932 }
  32933 #else
  32934 __ai __attribute__((target("neon"))) float32x4_t vsubq_f32(float32x4_t __p0, float32x4_t __p1) {
  32935   float32x4_t __ret;
  32936   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  32937   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  32938   __ret = __rev0 - __rev1;
  32939   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  32940   return __ret;
  32941 }
  32942 #endif
  32943 
  32944 #ifdef __LITTLE_ENDIAN__
  32945 __ai __attribute__((target("neon"))) int32x4_t vsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  32946   int32x4_t __ret;
  32947   __ret = __p0 - __p1;
  32948   return __ret;
  32949 }
  32950 #else
  32951 __ai __attribute__((target("neon"))) int32x4_t vsubq_s32(int32x4_t __p0, int32x4_t __p1) {
  32952   int32x4_t __ret;
  32953   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  32954   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  32955   __ret = __rev0 - __rev1;
  32956   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  32957   return __ret;
  32958 }
  32959 #endif
  32960 
  32961 #ifdef __LITTLE_ENDIAN__
  32962 __ai __attribute__((target("neon"))) int64x2_t vsubq_s64(int64x2_t __p0, int64x2_t __p1) {
  32963   int64x2_t __ret;
  32964   __ret = __p0 - __p1;
  32965   return __ret;
  32966 }
  32967 #else
  32968 __ai __attribute__((target("neon"))) int64x2_t vsubq_s64(int64x2_t __p0, int64x2_t __p1) {
  32969   int64x2_t __ret;
  32970   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  32971   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  32972   __ret = __rev0 - __rev1;
  32973   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  32974   return __ret;
  32975 }
  32976 #endif
  32977 
  32978 #ifdef __LITTLE_ENDIAN__
  32979 __ai __attribute__((target("neon"))) int16x8_t vsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  32980   int16x8_t __ret;
  32981   __ret = __p0 - __p1;
  32982   return __ret;
  32983 }
  32984 #else
  32985 __ai __attribute__((target("neon"))) int16x8_t vsubq_s16(int16x8_t __p0, int16x8_t __p1) {
  32986   int16x8_t __ret;
  32987   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  32988   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  32989   __ret = __rev0 - __rev1;
  32990   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  32991   return __ret;
  32992 }
  32993 #endif
  32994 
  32995 #ifdef __LITTLE_ENDIAN__
  32996 __ai __attribute__((target("neon"))) uint8x8_t vsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  32997   uint8x8_t __ret;
  32998   __ret = __p0 - __p1;
  32999   return __ret;
  33000 }
  33001 #else
  33002 __ai __attribute__((target("neon"))) uint8x8_t vsub_u8(uint8x8_t __p0, uint8x8_t __p1) {
  33003   uint8x8_t __ret;
  33004   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33005   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33006   __ret = __rev0 - __rev1;
  33007   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33008   return __ret;
  33009 }
  33010 #endif
  33011 
  33012 #ifdef __LITTLE_ENDIAN__
  33013 __ai __attribute__((target("neon"))) uint32x2_t vsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  33014   uint32x2_t __ret;
  33015   __ret = __p0 - __p1;
  33016   return __ret;
  33017 }
  33018 #else
  33019 __ai __attribute__((target("neon"))) uint32x2_t vsub_u32(uint32x2_t __p0, uint32x2_t __p1) {
  33020   uint32x2_t __ret;
  33021   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33022   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33023   __ret = __rev0 - __rev1;
  33024   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33025   return __ret;
  33026 }
  33027 #endif
  33028 
  33029 __ai __attribute__((target("neon"))) uint64x1_t vsub_u64(uint64x1_t __p0, uint64x1_t __p1) {
  33030   uint64x1_t __ret;
  33031   __ret = __p0 - __p1;
  33032   return __ret;
  33033 }
  33034 #ifdef __LITTLE_ENDIAN__
  33035 __ai __attribute__((target("neon"))) uint16x4_t vsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  33036   uint16x4_t __ret;
  33037   __ret = __p0 - __p1;
  33038   return __ret;
  33039 }
  33040 #else
  33041 __ai __attribute__((target("neon"))) uint16x4_t vsub_u16(uint16x4_t __p0, uint16x4_t __p1) {
  33042   uint16x4_t __ret;
  33043   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33044   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33045   __ret = __rev0 - __rev1;
  33046   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33047   return __ret;
  33048 }
  33049 #endif
  33050 
  33051 #ifdef __LITTLE_ENDIAN__
  33052 __ai __attribute__((target("neon"))) int8x8_t vsub_s8(int8x8_t __p0, int8x8_t __p1) {
  33053   int8x8_t __ret;
  33054   __ret = __p0 - __p1;
  33055   return __ret;
  33056 }
  33057 #else
  33058 __ai __attribute__((target("neon"))) int8x8_t vsub_s8(int8x8_t __p0, int8x8_t __p1) {
  33059   int8x8_t __ret;
  33060   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33061   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33062   __ret = __rev0 - __rev1;
  33063   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33064   return __ret;
  33065 }
  33066 #endif
  33067 
  33068 #ifdef __LITTLE_ENDIAN__
  33069 __ai __attribute__((target("neon"))) float32x2_t vsub_f32(float32x2_t __p0, float32x2_t __p1) {
  33070   float32x2_t __ret;
  33071   __ret = __p0 - __p1;
  33072   return __ret;
  33073 }
  33074 #else
  33075 __ai __attribute__((target("neon"))) float32x2_t vsub_f32(float32x2_t __p0, float32x2_t __p1) {
  33076   float32x2_t __ret;
  33077   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33078   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33079   __ret = __rev0 - __rev1;
  33080   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33081   return __ret;
  33082 }
  33083 #endif
  33084 
  33085 #ifdef __LITTLE_ENDIAN__
  33086 __ai __attribute__((target("neon"))) int32x2_t vsub_s32(int32x2_t __p0, int32x2_t __p1) {
  33087   int32x2_t __ret;
  33088   __ret = __p0 - __p1;
  33089   return __ret;
  33090 }
  33091 #else
  33092 __ai __attribute__((target("neon"))) int32x2_t vsub_s32(int32x2_t __p0, int32x2_t __p1) {
  33093   int32x2_t __ret;
  33094   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33095   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33096   __ret = __rev0 - __rev1;
  33097   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33098   return __ret;
  33099 }
  33100 #endif
  33101 
  33102 __ai __attribute__((target("neon"))) int64x1_t vsub_s64(int64x1_t __p0, int64x1_t __p1) {
  33103   int64x1_t __ret;
  33104   __ret = __p0 - __p1;
  33105   return __ret;
  33106 }
  33107 #ifdef __LITTLE_ENDIAN__
  33108 __ai __attribute__((target("neon"))) int16x4_t vsub_s16(int16x4_t __p0, int16x4_t __p1) {
  33109   int16x4_t __ret;
  33110   __ret = __p0 - __p1;
  33111   return __ret;
  33112 }
  33113 #else
  33114 __ai __attribute__((target("neon"))) int16x4_t vsub_s16(int16x4_t __p0, int16x4_t __p1) {
  33115   int16x4_t __ret;
  33116   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33117   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33118   __ret = __rev0 - __rev1;
  33119   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33120   return __ret;
  33121 }
  33122 #endif
  33123 
  33124 #ifdef __LITTLE_ENDIAN__
  33125 __ai __attribute__((target("neon"))) uint16x4_t vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  33126   uint16x4_t __ret;
  33127   __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  33128   return __ret;
  33129 }
  33130 #else
  33131 __ai __attribute__((target("neon"))) uint16x4_t vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  33132   uint16x4_t __ret;
  33133   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33134   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33135   __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17);
  33136   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33137   return __ret;
  33138 }
  33139 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) {
  33140   uint16x4_t __ret;
  33141   __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17);
  33142   return __ret;
  33143 }
  33144 #endif
  33145 
  33146 #ifdef __LITTLE_ENDIAN__
  33147 __ai __attribute__((target("neon"))) uint32x2_t vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  33148   uint32x2_t __ret;
  33149   __ret = (uint32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  33150   return __ret;
  33151 }
  33152 #else
  33153 __ai __attribute__((target("neon"))) uint32x2_t vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  33154   uint32x2_t __ret;
  33155   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33156   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33157   __ret = (uint32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18);
  33158   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33159   return __ret;
  33160 }
  33161 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) {
  33162   uint32x2_t __ret;
  33163   __ret = (uint32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18);
  33164   return __ret;
  33165 }
  33166 #endif
  33167 
  33168 #ifdef __LITTLE_ENDIAN__
  33169 __ai __attribute__((target("neon"))) uint8x8_t vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  33170   uint8x8_t __ret;
  33171   __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  33172   return __ret;
  33173 }
  33174 #else
  33175 __ai __attribute__((target("neon"))) uint8x8_t vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  33176   uint8x8_t __ret;
  33177   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33178   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33179   __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16);
  33180   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33181   return __ret;
  33182 }
  33183 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) {
  33184   uint8x8_t __ret;
  33185   __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16);
  33186   return __ret;
  33187 }
  33188 #endif
  33189 
  33190 #ifdef __LITTLE_ENDIAN__
  33191 __ai __attribute__((target("neon"))) int16x4_t vsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  33192   int16x4_t __ret;
  33193   __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  33194   return __ret;
  33195 }
  33196 #else
  33197 __ai __attribute__((target("neon"))) int16x4_t vsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  33198   int16x4_t __ret;
  33199   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33200   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33201   __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1);
  33202   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33203   return __ret;
  33204 }
  33205 __ai __attribute__((target("neon"))) int16x4_t __noswap_vsubhn_s32(int32x4_t __p0, int32x4_t __p1) {
  33206   int16x4_t __ret;
  33207   __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1);
  33208   return __ret;
  33209 }
  33210 #endif
  33211 
  33212 #ifdef __LITTLE_ENDIAN__
  33213 __ai __attribute__((target("neon"))) int32x2_t vsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  33214   int32x2_t __ret;
  33215   __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  33216   return __ret;
  33217 }
  33218 #else
  33219 __ai __attribute__((target("neon"))) int32x2_t vsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  33220   int32x2_t __ret;
  33221   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33222   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33223   __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2);
  33224   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33225   return __ret;
  33226 }
  33227 __ai __attribute__((target("neon"))) int32x2_t __noswap_vsubhn_s64(int64x2_t __p0, int64x2_t __p1) {
  33228   int32x2_t __ret;
  33229   __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2);
  33230   return __ret;
  33231 }
  33232 #endif
  33233 
  33234 #ifdef __LITTLE_ENDIAN__
  33235 __ai __attribute__((target("neon"))) int8x8_t vsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  33236   int8x8_t __ret;
  33237   __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  33238   return __ret;
  33239 }
  33240 #else
  33241 __ai __attribute__((target("neon"))) int8x8_t vsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  33242   int8x8_t __ret;
  33243   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33244   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33245   __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0);
  33246   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33247   return __ret;
  33248 }
  33249 __ai __attribute__((target("neon"))) int8x8_t __noswap_vsubhn_s16(int16x8_t __p0, int16x8_t __p1) {
  33250   int8x8_t __ret;
  33251   __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0);
  33252   return __ret;
  33253 }
  33254 #endif
  33255 
  33256 #ifdef __LITTLE_ENDIAN__
  33257 __ai __attribute__((target("neon"))) uint16x8_t vsubl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  33258   uint16x8_t __ret;
  33259   __ret = vmovl_u8(__p0) - vmovl_u8(__p1);
  33260   return __ret;
  33261 }
  33262 #else
  33263 __ai __attribute__((target("neon"))) uint16x8_t vsubl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  33264   uint16x8_t __ret;
  33265   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33266   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33267   __ret = __noswap_vmovl_u8(__rev0) - __noswap_vmovl_u8(__rev1);
  33268   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33269   return __ret;
  33270 }
  33271 #endif
  33272 
  33273 #ifdef __LITTLE_ENDIAN__
  33274 __ai __attribute__((target("neon"))) uint64x2_t vsubl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  33275   uint64x2_t __ret;
  33276   __ret = vmovl_u32(__p0) - vmovl_u32(__p1);
  33277   return __ret;
  33278 }
  33279 #else
  33280 __ai __attribute__((target("neon"))) uint64x2_t vsubl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  33281   uint64x2_t __ret;
  33282   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33283   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33284   __ret = __noswap_vmovl_u32(__rev0) - __noswap_vmovl_u32(__rev1);
  33285   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33286   return __ret;
  33287 }
  33288 #endif
  33289 
  33290 #ifdef __LITTLE_ENDIAN__
  33291 __ai __attribute__((target("neon"))) uint32x4_t vsubl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  33292   uint32x4_t __ret;
  33293   __ret = vmovl_u16(__p0) - vmovl_u16(__p1);
  33294   return __ret;
  33295 }
  33296 #else
  33297 __ai __attribute__((target("neon"))) uint32x4_t vsubl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  33298   uint32x4_t __ret;
  33299   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33300   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33301   __ret = __noswap_vmovl_u16(__rev0) - __noswap_vmovl_u16(__rev1);
  33302   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33303   return __ret;
  33304 }
  33305 #endif
  33306 
  33307 #ifdef __LITTLE_ENDIAN__
  33308 __ai __attribute__((target("neon"))) int16x8_t vsubl_s8(int8x8_t __p0, int8x8_t __p1) {
  33309   int16x8_t __ret;
  33310   __ret = vmovl_s8(__p0) - vmovl_s8(__p1);
  33311   return __ret;
  33312 }
  33313 #else
  33314 __ai __attribute__((target("neon"))) int16x8_t vsubl_s8(int8x8_t __p0, int8x8_t __p1) {
  33315   int16x8_t __ret;
  33316   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33317   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33318   __ret = __noswap_vmovl_s8(__rev0) - __noswap_vmovl_s8(__rev1);
  33319   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33320   return __ret;
  33321 }
  33322 #endif
  33323 
  33324 #ifdef __LITTLE_ENDIAN__
  33325 __ai __attribute__((target("neon"))) int64x2_t vsubl_s32(int32x2_t __p0, int32x2_t __p1) {
  33326   int64x2_t __ret;
  33327   __ret = vmovl_s32(__p0) - vmovl_s32(__p1);
  33328   return __ret;
  33329 }
  33330 #else
  33331 __ai __attribute__((target("neon"))) int64x2_t vsubl_s32(int32x2_t __p0, int32x2_t __p1) {
  33332   int64x2_t __ret;
  33333   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33334   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33335   __ret = __noswap_vmovl_s32(__rev0) - __noswap_vmovl_s32(__rev1);
  33336   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33337   return __ret;
  33338 }
  33339 #endif
  33340 
  33341 #ifdef __LITTLE_ENDIAN__
  33342 __ai __attribute__((target("neon"))) int32x4_t vsubl_s16(int16x4_t __p0, int16x4_t __p1) {
  33343   int32x4_t __ret;
  33344   __ret = vmovl_s16(__p0) - vmovl_s16(__p1);
  33345   return __ret;
  33346 }
  33347 #else
  33348 __ai __attribute__((target("neon"))) int32x4_t vsubl_s16(int16x4_t __p0, int16x4_t __p1) {
  33349   int32x4_t __ret;
  33350   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33351   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33352   __ret = __noswap_vmovl_s16(__rev0) - __noswap_vmovl_s16(__rev1);
  33353   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33354   return __ret;
  33355 }
  33356 #endif
  33357 
  33358 #ifdef __LITTLE_ENDIAN__
  33359 __ai __attribute__((target("neon"))) uint16x8_t vsubw_u8(uint16x8_t __p0, uint8x8_t __p1) {
  33360   uint16x8_t __ret;
  33361   __ret = __p0 - vmovl_u8(__p1);
  33362   return __ret;
  33363 }
  33364 #else
  33365 __ai __attribute__((target("neon"))) uint16x8_t vsubw_u8(uint16x8_t __p0, uint8x8_t __p1) {
  33366   uint16x8_t __ret;
  33367   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33368   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33369   __ret = __rev0 - __noswap_vmovl_u8(__rev1);
  33370   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33371   return __ret;
  33372 }
  33373 #endif
  33374 
  33375 #ifdef __LITTLE_ENDIAN__
  33376 __ai __attribute__((target("neon"))) uint64x2_t vsubw_u32(uint64x2_t __p0, uint32x2_t __p1) {
  33377   uint64x2_t __ret;
  33378   __ret = __p0 - vmovl_u32(__p1);
  33379   return __ret;
  33380 }
  33381 #else
  33382 __ai __attribute__((target("neon"))) uint64x2_t vsubw_u32(uint64x2_t __p0, uint32x2_t __p1) {
  33383   uint64x2_t __ret;
  33384   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33385   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33386   __ret = __rev0 - __noswap_vmovl_u32(__rev1);
  33387   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33388   return __ret;
  33389 }
  33390 #endif
  33391 
  33392 #ifdef __LITTLE_ENDIAN__
  33393 __ai __attribute__((target("neon"))) uint32x4_t vsubw_u16(uint32x4_t __p0, uint16x4_t __p1) {
  33394   uint32x4_t __ret;
  33395   __ret = __p0 - vmovl_u16(__p1);
  33396   return __ret;
  33397 }
  33398 #else
  33399 __ai __attribute__((target("neon"))) uint32x4_t vsubw_u16(uint32x4_t __p0, uint16x4_t __p1) {
  33400   uint32x4_t __ret;
  33401   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33402   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33403   __ret = __rev0 - __noswap_vmovl_u16(__rev1);
  33404   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33405   return __ret;
  33406 }
  33407 #endif
  33408 
  33409 #ifdef __LITTLE_ENDIAN__
  33410 __ai __attribute__((target("neon"))) int16x8_t vsubw_s8(int16x8_t __p0, int8x8_t __p1) {
  33411   int16x8_t __ret;
  33412   __ret = __p0 - vmovl_s8(__p1);
  33413   return __ret;
  33414 }
  33415 #else
  33416 __ai __attribute__((target("neon"))) int16x8_t vsubw_s8(int16x8_t __p0, int8x8_t __p1) {
  33417   int16x8_t __ret;
  33418   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33419   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33420   __ret = __rev0 - __noswap_vmovl_s8(__rev1);
  33421   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33422   return __ret;
  33423 }
  33424 #endif
  33425 
  33426 #ifdef __LITTLE_ENDIAN__
  33427 __ai __attribute__((target("neon"))) int64x2_t vsubw_s32(int64x2_t __p0, int32x2_t __p1) {
  33428   int64x2_t __ret;
  33429   __ret = __p0 - vmovl_s32(__p1);
  33430   return __ret;
  33431 }
  33432 #else
  33433 __ai __attribute__((target("neon"))) int64x2_t vsubw_s32(int64x2_t __p0, int32x2_t __p1) {
  33434   int64x2_t __ret;
  33435   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  33436   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  33437   __ret = __rev0 - __noswap_vmovl_s32(__rev1);
  33438   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  33439   return __ret;
  33440 }
  33441 #endif
  33442 
  33443 #ifdef __LITTLE_ENDIAN__
  33444 __ai __attribute__((target("neon"))) int32x4_t vsubw_s16(int32x4_t __p0, int16x4_t __p1) {
  33445   int32x4_t __ret;
  33446   __ret = __p0 - vmovl_s16(__p1);
  33447   return __ret;
  33448 }
  33449 #else
  33450 __ai __attribute__((target("neon"))) int32x4_t vsubw_s16(int32x4_t __p0, int16x4_t __p1) {
  33451   int32x4_t __ret;
  33452   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33453   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33454   __ret = __rev0 - __noswap_vmovl_s16(__rev1);
  33455   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  33456   return __ret;
  33457 }
  33458 #endif
  33459 
  33460 #ifdef __LITTLE_ENDIAN__
  33461 __ai __attribute__((target("neon"))) poly8x8_t vtbl1_p8(poly8x8_t __p0, uint8x8_t __p1) {
  33462   poly8x8_t __ret;
  33463   __ret = (poly8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 4);
  33464   return __ret;
  33465 }
  33466 #else
  33467 __ai __attribute__((target("neon"))) poly8x8_t vtbl1_p8(poly8x8_t __p0, uint8x8_t __p1) {
  33468   poly8x8_t __ret;
  33469   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33470   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33471   __ret = (poly8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4);
  33472   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33473   return __ret;
  33474 }
  33475 #endif
  33476 
  33477 #ifdef __LITTLE_ENDIAN__
  33478 __ai __attribute__((target("neon"))) uint8x8_t vtbl1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  33479   uint8x8_t __ret;
  33480   __ret = (uint8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  33481   return __ret;
  33482 }
  33483 #else
  33484 __ai __attribute__((target("neon"))) uint8x8_t vtbl1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  33485   uint8x8_t __ret;
  33486   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33487   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33488   __ret = (uint8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  33489   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33490   return __ret;
  33491 }
  33492 #endif
  33493 
  33494 #ifdef __LITTLE_ENDIAN__
  33495 __ai __attribute__((target("neon"))) int8x8_t vtbl1_s8(int8x8_t __p0, int8x8_t __p1) {
  33496   int8x8_t __ret;
  33497   __ret = (int8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  33498   return __ret;
  33499 }
  33500 #else
  33501 __ai __attribute__((target("neon"))) int8x8_t vtbl1_s8(int8x8_t __p0, int8x8_t __p1) {
  33502   int8x8_t __ret;
  33503   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33504   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33505   __ret = (int8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  33506   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33507   return __ret;
  33508 }
  33509 #endif
  33510 
  33511 #ifdef __LITTLE_ENDIAN__
  33512 __ai __attribute__((target("neon"))) poly8x8_t vtbl2_p8(poly8x8x2_t __p0, uint8x8_t __p1) {
  33513   poly8x8_t __ret;
  33514   __ret = (poly8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 4);
  33515   return __ret;
  33516 }
  33517 #else
  33518 __ai __attribute__((target("neon"))) poly8x8_t vtbl2_p8(poly8x8x2_t __p0, uint8x8_t __p1) {
  33519   poly8x8_t __ret;
  33520   poly8x8x2_t __rev0;
  33521   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33522   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33523   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33524   __ret = (poly8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 4);
  33525   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33526   return __ret;
  33527 }
  33528 #endif
  33529 
  33530 #ifdef __LITTLE_ENDIAN__
  33531 __ai __attribute__((target("neon"))) uint8x8_t vtbl2_u8(uint8x8x2_t __p0, uint8x8_t __p1) {
  33532   uint8x8_t __ret;
  33533   __ret = (uint8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 16);
  33534   return __ret;
  33535 }
  33536 #else
  33537 __ai __attribute__((target("neon"))) uint8x8_t vtbl2_u8(uint8x8x2_t __p0, uint8x8_t __p1) {
  33538   uint8x8_t __ret;
  33539   uint8x8x2_t __rev0;
  33540   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33541   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33542   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33543   __ret = (uint8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 16);
  33544   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33545   return __ret;
  33546 }
  33547 #endif
  33548 
  33549 #ifdef __LITTLE_ENDIAN__
  33550 __ai __attribute__((target("neon"))) int8x8_t vtbl2_s8(int8x8x2_t __p0, int8x8_t __p1) {
  33551   int8x8_t __ret;
  33552   __ret = (int8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 0);
  33553   return __ret;
  33554 }
  33555 #else
  33556 __ai __attribute__((target("neon"))) int8x8_t vtbl2_s8(int8x8x2_t __p0, int8x8_t __p1) {
  33557   int8x8_t __ret;
  33558   int8x8x2_t __rev0;
  33559   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33560   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33561   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33562   __ret = (int8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 0);
  33563   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33564   return __ret;
  33565 }
  33566 #endif
  33567 
  33568 #ifdef __LITTLE_ENDIAN__
  33569 __ai __attribute__((target("neon"))) poly8x8_t vtbl3_p8(poly8x8x3_t __p0, uint8x8_t __p1) {
  33570   poly8x8_t __ret;
  33571   __ret = (poly8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 4);
  33572   return __ret;
  33573 }
  33574 #else
  33575 __ai __attribute__((target("neon"))) poly8x8_t vtbl3_p8(poly8x8x3_t __p0, uint8x8_t __p1) {
  33576   poly8x8_t __ret;
  33577   poly8x8x3_t __rev0;
  33578   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33579   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33580   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33581   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33582   __ret = (poly8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 4);
  33583   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33584   return __ret;
  33585 }
  33586 #endif
  33587 
  33588 #ifdef __LITTLE_ENDIAN__
  33589 __ai __attribute__((target("neon"))) uint8x8_t vtbl3_u8(uint8x8x3_t __p0, uint8x8_t __p1) {
  33590   uint8x8_t __ret;
  33591   __ret = (uint8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 16);
  33592   return __ret;
  33593 }
  33594 #else
  33595 __ai __attribute__((target("neon"))) uint8x8_t vtbl3_u8(uint8x8x3_t __p0, uint8x8_t __p1) {
  33596   uint8x8_t __ret;
  33597   uint8x8x3_t __rev0;
  33598   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33599   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33600   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33601   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33602   __ret = (uint8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 16);
  33603   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33604   return __ret;
  33605 }
  33606 #endif
  33607 
  33608 #ifdef __LITTLE_ENDIAN__
  33609 __ai __attribute__((target("neon"))) int8x8_t vtbl3_s8(int8x8x3_t __p0, int8x8_t __p1) {
  33610   int8x8_t __ret;
  33611   __ret = (int8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 0);
  33612   return __ret;
  33613 }
  33614 #else
  33615 __ai __attribute__((target("neon"))) int8x8_t vtbl3_s8(int8x8x3_t __p0, int8x8_t __p1) {
  33616   int8x8_t __ret;
  33617   int8x8x3_t __rev0;
  33618   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33619   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33620   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33621   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33622   __ret = (int8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 0);
  33623   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33624   return __ret;
  33625 }
  33626 #endif
  33627 
  33628 #ifdef __LITTLE_ENDIAN__
  33629 __ai __attribute__((target("neon"))) poly8x8_t vtbl4_p8(poly8x8x4_t __p0, uint8x8_t __p1) {
  33630   poly8x8_t __ret;
  33631   __ret = (poly8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], (int8x8_t)__p1, 4);
  33632   return __ret;
  33633 }
  33634 #else
  33635 __ai __attribute__((target("neon"))) poly8x8_t vtbl4_p8(poly8x8x4_t __p0, uint8x8_t __p1) {
  33636   poly8x8_t __ret;
  33637   poly8x8x4_t __rev0;
  33638   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33639   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33640   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33641   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33642   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33643   __ret = (poly8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 4);
  33644   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33645   return __ret;
  33646 }
  33647 #endif
  33648 
  33649 #ifdef __LITTLE_ENDIAN__
  33650 __ai __attribute__((target("neon"))) uint8x8_t vtbl4_u8(uint8x8x4_t __p0, uint8x8_t __p1) {
  33651   uint8x8_t __ret;
  33652   __ret = (uint8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], (int8x8_t)__p1, 16);
  33653   return __ret;
  33654 }
  33655 #else
  33656 __ai __attribute__((target("neon"))) uint8x8_t vtbl4_u8(uint8x8x4_t __p0, uint8x8_t __p1) {
  33657   uint8x8_t __ret;
  33658   uint8x8x4_t __rev0;
  33659   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33660   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33661   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33662   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33663   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33664   __ret = (uint8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 16);
  33665   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33666   return __ret;
  33667 }
  33668 #endif
  33669 
  33670 #ifdef __LITTLE_ENDIAN__
  33671 __ai __attribute__((target("neon"))) int8x8_t vtbl4_s8(int8x8x4_t __p0, int8x8_t __p1) {
  33672   int8x8_t __ret;
  33673   __ret = (int8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], (int8x8_t)__p1, 0);
  33674   return __ret;
  33675 }
  33676 #else
  33677 __ai __attribute__((target("neon"))) int8x8_t vtbl4_s8(int8x8x4_t __p0, int8x8_t __p1) {
  33678   int8x8_t __ret;
  33679   int8x8x4_t __rev0;
  33680   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33681   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33682   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33683   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33684   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33685   __ret = (int8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 0);
  33686   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33687   return __ret;
  33688 }
  33689 #endif
  33690 
  33691 #ifdef __LITTLE_ENDIAN__
  33692 __ai __attribute__((target("neon"))) poly8x8_t vtbx1_p8(poly8x8_t __p0, poly8x8_t __p1, uint8x8_t __p2) {
  33693   poly8x8_t __ret;
  33694   __ret = (poly8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 4);
  33695   return __ret;
  33696 }
  33697 #else
  33698 __ai __attribute__((target("neon"))) poly8x8_t vtbx1_p8(poly8x8_t __p0, poly8x8_t __p1, uint8x8_t __p2) {
  33699   poly8x8_t __ret;
  33700   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33701   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33702   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33703   __ret = (poly8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 4);
  33704   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33705   return __ret;
  33706 }
  33707 #endif
  33708 
  33709 #ifdef __LITTLE_ENDIAN__
  33710 __ai __attribute__((target("neon"))) uint8x8_t vtbx1_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  33711   uint8x8_t __ret;
  33712   __ret = (uint8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 16);
  33713   return __ret;
  33714 }
  33715 #else
  33716 __ai __attribute__((target("neon"))) uint8x8_t vtbx1_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  33717   uint8x8_t __ret;
  33718   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33719   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33720   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33721   __ret = (uint8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 16);
  33722   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33723   return __ret;
  33724 }
  33725 #endif
  33726 
  33727 #ifdef __LITTLE_ENDIAN__
  33728 __ai __attribute__((target("neon"))) int8x8_t vtbx1_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  33729   int8x8_t __ret;
  33730   __ret = (int8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 0);
  33731   return __ret;
  33732 }
  33733 #else
  33734 __ai __attribute__((target("neon"))) int8x8_t vtbx1_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  33735   int8x8_t __ret;
  33736   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33737   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33738   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33739   __ret = (int8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 0);
  33740   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33741   return __ret;
  33742 }
  33743 #endif
  33744 
  33745 #ifdef __LITTLE_ENDIAN__
  33746 __ai __attribute__((target("neon"))) poly8x8_t vtbx2_p8(poly8x8_t __p0, poly8x8x2_t __p1, uint8x8_t __p2) {
  33747   poly8x8_t __ret;
  33748   __ret = (poly8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 4);
  33749   return __ret;
  33750 }
  33751 #else
  33752 __ai __attribute__((target("neon"))) poly8x8_t vtbx2_p8(poly8x8_t __p0, poly8x8x2_t __p1, uint8x8_t __p2) {
  33753   poly8x8_t __ret;
  33754   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33755   poly8x8x2_t __rev1;
  33756   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33757   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33758   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33759   __ret = (poly8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 4);
  33760   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33761   return __ret;
  33762 }
  33763 #endif
  33764 
  33765 #ifdef __LITTLE_ENDIAN__
  33766 __ai __attribute__((target("neon"))) uint8x8_t vtbx2_u8(uint8x8_t __p0, uint8x8x2_t __p1, uint8x8_t __p2) {
  33767   uint8x8_t __ret;
  33768   __ret = (uint8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 16);
  33769   return __ret;
  33770 }
  33771 #else
  33772 __ai __attribute__((target("neon"))) uint8x8_t vtbx2_u8(uint8x8_t __p0, uint8x8x2_t __p1, uint8x8_t __p2) {
  33773   uint8x8_t __ret;
  33774   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33775   uint8x8x2_t __rev1;
  33776   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33777   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33778   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33779   __ret = (uint8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 16);
  33780   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33781   return __ret;
  33782 }
  33783 #endif
  33784 
  33785 #ifdef __LITTLE_ENDIAN__
  33786 __ai __attribute__((target("neon"))) int8x8_t vtbx2_s8(int8x8_t __p0, int8x8x2_t __p1, int8x8_t __p2) {
  33787   int8x8_t __ret;
  33788   __ret = (int8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 0);
  33789   return __ret;
  33790 }
  33791 #else
  33792 __ai __attribute__((target("neon"))) int8x8_t vtbx2_s8(int8x8_t __p0, int8x8x2_t __p1, int8x8_t __p2) {
  33793   int8x8_t __ret;
  33794   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33795   int8x8x2_t __rev1;
  33796   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33797   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33798   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33799   __ret = (int8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 0);
  33800   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33801   return __ret;
  33802 }
  33803 #endif
  33804 
  33805 #ifdef __LITTLE_ENDIAN__
  33806 __ai __attribute__((target("neon"))) poly8x8_t vtbx3_p8(poly8x8_t __p0, poly8x8x3_t __p1, uint8x8_t __p2) {
  33807   poly8x8_t __ret;
  33808   __ret = (poly8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 4);
  33809   return __ret;
  33810 }
  33811 #else
  33812 __ai __attribute__((target("neon"))) poly8x8_t vtbx3_p8(poly8x8_t __p0, poly8x8x3_t __p1, uint8x8_t __p2) {
  33813   poly8x8_t __ret;
  33814   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33815   poly8x8x3_t __rev1;
  33816   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33817   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33818   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33819   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33820   __ret = (poly8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 4);
  33821   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33822   return __ret;
  33823 }
  33824 #endif
  33825 
  33826 #ifdef __LITTLE_ENDIAN__
  33827 __ai __attribute__((target("neon"))) uint8x8_t vtbx3_u8(uint8x8_t __p0, uint8x8x3_t __p1, uint8x8_t __p2) {
  33828   uint8x8_t __ret;
  33829   __ret = (uint8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 16);
  33830   return __ret;
  33831 }
  33832 #else
  33833 __ai __attribute__((target("neon"))) uint8x8_t vtbx3_u8(uint8x8_t __p0, uint8x8x3_t __p1, uint8x8_t __p2) {
  33834   uint8x8_t __ret;
  33835   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33836   uint8x8x3_t __rev1;
  33837   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33838   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33839   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33840   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33841   __ret = (uint8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 16);
  33842   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33843   return __ret;
  33844 }
  33845 #endif
  33846 
  33847 #ifdef __LITTLE_ENDIAN__
        /* vtbx3_s8: wrapper around __builtin_neon_vtbx3_v for int8x8_t operands.
         * __p0 and __p2 are single vectors; the three vectors of the table __p1
         * (val[0..2]) are passed as separate arguments. The builtin's result is
         * cast back to int8x8_t and returned.
         * NOTE(review): by ACLE naming this is the 3-register extended table
         * lookup (VTBX) -- confirm exact semantics in the Arm reference.
         * The trailing 0 is presumably the element-type code (int8) selecting
         * the builtin's overload -- TODO confirm against clang.
         * Little-endian variant: arguments are forwarded unchanged. */
  33848 __ai __attribute__((target("neon"))) int8x8_t vtbx3_s8(int8x8_t __p0, int8x8x3_t __p1, int8x8_t __p2) {
  33849   int8x8_t __ret;
  33850   __ret = (int8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 0);
  33851   return __ret;
  33852 }
  33853 #else
        /* Big-endian variant: every 8-lane input is lane-reversed (7..0) before
         * the call, and the result is reversed back before returning. */
  33854 __ai __attribute__((target("neon"))) int8x8_t vtbx3_s8(int8x8_t __p0, int8x8x3_t __p1, int8x8_t __p2) {
  33855   int8x8_t __ret;
  33856   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33857   int8x8x3_t __rev1;
  33858   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33859   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33860   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33861   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33862   __ret = (int8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 0);
  33863   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33864   return __ret;
  33865 }
  33866 #endif
  33867 
  33868 #ifdef __LITTLE_ENDIAN__
        /* vtbx4_p8: wrapper around __builtin_neon_vtbx4_v for poly8x8_t data with
         * a uint8x8_t third operand (__p2). The four vectors of the table __p1
         * (val[0..3]) are passed as separate arguments; all operands are cast to
         * int8x8_t and the result is cast back to poly8x8_t.
         * NOTE(review): by ACLE naming this is the 4-register extended table
         * lookup (VTBX) -- confirm exact semantics in the Arm reference.
         * The trailing 4 is presumably the element-type code (poly8) -- TODO
         * confirm against clang.
         * Little-endian variant: arguments are forwarded unchanged. */
  33869 __ai __attribute__((target("neon"))) poly8x8_t vtbx4_p8(poly8x8_t __p0, poly8x8x4_t __p1, uint8x8_t __p2) {
  33870   poly8x8_t __ret;
  33871   __ret = (poly8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p1.val[3], (int8x8_t)__p2, 4);
  33872   return __ret;
  33873 }
  33874 #else
        /* Big-endian variant: every 8-lane input is lane-reversed (7..0) before
         * the call, and the result is reversed back before returning. */
  33875 __ai __attribute__((target("neon"))) poly8x8_t vtbx4_p8(poly8x8_t __p0, poly8x8x4_t __p1, uint8x8_t __p2) {
  33876   poly8x8_t __ret;
  33877   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33878   poly8x8x4_t __rev1;
  33879   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33880   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33881   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33882   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33883   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33884   __ret = (poly8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 4);
  33885   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33886   return __ret;
  33887 }
  33888 #endif
  33889 
  33890 #ifdef __LITTLE_ENDIAN__
        /* vtbx4_u8: wrapper around __builtin_neon_vtbx4_v for uint8x8_t operands.
         * The four vectors of the table __p1 (val[0..3]) are passed as separate
         * arguments; all operands are cast to int8x8_t and the result is cast
         * back to uint8x8_t.
         * NOTE(review): by ACLE naming this is the 4-register extended table
         * lookup (VTBX) -- confirm exact semantics in the Arm reference.
         * The trailing 16 is presumably the element-type code (uint8) -- TODO
         * confirm against clang.
         * Little-endian variant: arguments are forwarded unchanged. */
  33891 __ai __attribute__((target("neon"))) uint8x8_t vtbx4_u8(uint8x8_t __p0, uint8x8x4_t __p1, uint8x8_t __p2) {
  33892   uint8x8_t __ret;
  33893   __ret = (uint8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p1.val[3], (int8x8_t)__p2, 16);
  33894   return __ret;
  33895 }
  33896 #else
        /* Big-endian variant: every 8-lane input is lane-reversed (7..0) before
         * the call, and the result is reversed back before returning. */
  33897 __ai __attribute__((target("neon"))) uint8x8_t vtbx4_u8(uint8x8_t __p0, uint8x8x4_t __p1, uint8x8_t __p2) {
  33898   uint8x8_t __ret;
  33899   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33900   uint8x8x4_t __rev1;
  33901   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33902   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33903   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33904   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33905   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33906   __ret = (uint8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 16);
  33907   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33908   return __ret;
  33909 }
  33910 #endif
  33911 
  33912 #ifdef __LITTLE_ENDIAN__
        /* vtbx4_s8: wrapper around __builtin_neon_vtbx4_v for int8x8_t operands.
         * The four vectors of the table __p1 (val[0..3]) are passed as separate
         * arguments; the builtin's result is cast to int8x8_t and returned.
         * NOTE(review): by ACLE naming this is the 4-register extended table
         * lookup (VTBX) -- confirm exact semantics in the Arm reference.
         * The trailing 0 is presumably the element-type code (int8) -- TODO
         * confirm against clang.
         * Little-endian variant: arguments are forwarded unchanged. */
  33913 __ai __attribute__((target("neon"))) int8x8_t vtbx4_s8(int8x8_t __p0, int8x8x4_t __p1, int8x8_t __p2) {
  33914   int8x8_t __ret;
  33915   __ret = (int8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p1.val[3], (int8x8_t)__p2, 0);
  33916   return __ret;
  33917 }
  33918 #else
        /* Big-endian variant: every 8-lane input is lane-reversed (7..0) before
         * the call, and the result is reversed back before returning. */
  33919 __ai __attribute__((target("neon"))) int8x8_t vtbx4_s8(int8x8_t __p0, int8x8x4_t __p1, int8x8_t __p2) {
  33920   int8x8_t __ret;
  33921   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33922   int8x8x4_t __rev1;
  33923   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33924   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33925   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0);
  33926   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0);
  33927   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  33928   __ret = (int8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 0);
  33929   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  33930   return __ret;
  33931 }
  33932 #endif
  33933 
  33934 #ifdef __LITTLE_ENDIAN__
        /* vtrn_p8: calls __builtin_neon_vtrn_v on two poly8x8_t vectors (cast to
         * int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result poly8x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 4 is presumably the element-type code (poly8) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  33935 __ai __attribute__((target("neon"))) poly8x8x2_t vtrn_p8(poly8x8_t __p0, poly8x8_t __p1) {
  33936   poly8x8x2_t __ret;
  33937   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4);
  33938   return __ret;
  33939 }
  33940 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  33941 __ai __attribute__((target("neon"))) poly8x8x2_t vtrn_p8(poly8x8_t __p0, poly8x8_t __p1) {
  33942   poly8x8x2_t __ret;
  33943   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  33944   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  33945   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4);
  33946 
  33947   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  33948   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  33949   return __ret;
  33950 }
  33951 #endif
  33952 
  33953 #ifdef __LITTLE_ENDIAN__
        /* vtrn_p16: calls __builtin_neon_vtrn_v on two poly16x4_t vectors (cast
         * to int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result poly16x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 5 is presumably the element-type code (poly16) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  33954 __ai __attribute__((target("neon"))) poly16x4x2_t vtrn_p16(poly16x4_t __p0, poly16x4_t __p1) {
  33955   poly16x4x2_t __ret;
  33956   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5);
  33957   return __ret;
  33958 }
  33959 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  33960 __ai __attribute__((target("neon"))) poly16x4x2_t vtrn_p16(poly16x4_t __p0, poly16x4_t __p1) {
  33961   poly16x4x2_t __ret;
  33962   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  33963   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  33964   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5);
  33965 
  33966   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  33967   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  33968   return __ret;
  33969 }
  33970 #endif
  33971 
  33972 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_p8: calls __builtin_neon_vtrnq_v on two poly8x16_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result poly8x16x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 36 is presumably the type code for 128-bit poly8 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  33973 __ai __attribute__((target("neon"))) poly8x16x2_t vtrnq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  33974   poly8x16x2_t __ret;
  33975   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 36);
  33976   return __ret;
  33977 }
  33978 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, then both result vectors are lane-reversed back. */
  33979 __ai __attribute__((target("neon"))) poly8x16x2_t vtrnq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  33980   poly8x16x2_t __ret;
  33981   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  33982   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  33983   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36);
  33984 
  33985   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  33986   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  33987   return __ret;
  33988 }
  33989 #endif
  33990 
  33991 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_p16: calls __builtin_neon_vtrnq_v on two poly16x8_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result poly16x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 37 is presumably the type code for 128-bit poly16 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  33992 __ai __attribute__((target("neon"))) poly16x8x2_t vtrnq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  33993   poly16x8x2_t __ret;
  33994   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37);
  33995   return __ret;
  33996 }
  33997 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  33998 __ai __attribute__((target("neon"))) poly16x8x2_t vtrnq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  33999   poly16x8x2_t __ret;
  34000   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34001   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34002   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37);
  34003 
  34004   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34005   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34006   return __ret;
  34007 }
  34008 #endif
  34009 
  34010 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_u8: calls __builtin_neon_vtrnq_v on two uint8x16_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result uint8x16x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 48 is presumably the type code for 128-bit uint8 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34011 __ai __attribute__((target("neon"))) uint8x16x2_t vtrnq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34012   uint8x16x2_t __ret;
  34013   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48);
  34014   return __ret;
  34015 }
  34016 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, then both result vectors are lane-reversed back. */
  34017 __ai __attribute__((target("neon"))) uint8x16x2_t vtrnq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34018   uint8x16x2_t __ret;
  34019   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34020   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34021   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  34022 
  34023   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34024   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34025   return __ret;
  34026 }
  34027 #endif
  34028 
  34029 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_u32: calls __builtin_neon_vtrnq_v on two uint32x4_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result uint32x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 50 is presumably the type code for 128-bit uint32 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34030 __ai __attribute__((target("neon"))) uint32x4x2_t vtrnq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34031   uint32x4x2_t __ret;
  34032   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50);
  34033   return __ret;
  34034 }
  34035 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34036 __ai __attribute__((target("neon"))) uint32x4x2_t vtrnq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34037   uint32x4x2_t __ret;
  34038   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34039   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34040   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  34041 
  34042   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34043   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34044   return __ret;
  34045 }
  34046 #endif
  34047 
  34048 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_u16: calls __builtin_neon_vtrnq_v on two uint16x8_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result uint16x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 49 is presumably the type code for 128-bit uint16 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34049 __ai __attribute__((target("neon"))) uint16x8x2_t vtrnq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34050   uint16x8x2_t __ret;
  34051   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49);
  34052   return __ret;
  34053 }
  34054 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  34055 __ai __attribute__((target("neon"))) uint16x8x2_t vtrnq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34056   uint16x8x2_t __ret;
  34057   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34058   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34059   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  34060 
  34061   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34062   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34063   return __ret;
  34064 }
  34065 #endif
  34066 
  34067 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_s8: calls __builtin_neon_vtrnq_v on two int8x16_t vectors. The
         * builtin receives &__ret as its first argument, so the two-vector
         * result int8x16x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 32 is presumably the type code for 128-bit int8 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34068 __ai __attribute__((target("neon"))) int8x16x2_t vtrnq_s8(int8x16_t __p0, int8x16_t __p1) {
  34069   int8x16x2_t __ret;
  34070   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 32);
  34071   return __ret;
  34072 }
  34073 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, then both result vectors are lane-reversed back. */
  34074 __ai __attribute__((target("neon"))) int8x16x2_t vtrnq_s8(int8x16_t __p0, int8x16_t __p1) {
  34075   int8x16x2_t __ret;
  34076   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34077   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34078   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  34079 
  34080   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34081   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34082   return __ret;
  34083 }
  34084 #endif
  34085 
  34086 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_f32: calls __builtin_neon_vtrnq_v on two float32x4_t vectors
         * (cast to int8x16_t). The builtin receives &__ret as its first argument,
         * so the two-vector result float32x4x2_t is filled in through that
         * pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 41 is presumably the type code for 128-bit float32 --
         * TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34087 __ai __attribute__((target("neon"))) float32x4x2_t vtrnq_f32(float32x4_t __p0, float32x4_t __p1) {
  34088   float32x4x2_t __ret;
  34089   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41);
  34090   return __ret;
  34091 }
  34092 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34093 __ai __attribute__((target("neon"))) float32x4x2_t vtrnq_f32(float32x4_t __p0, float32x4_t __p1) {
  34094   float32x4x2_t __ret;
  34095   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34096   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34097   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  34098 
  34099   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34100   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34101   return __ret;
  34102 }
  34103 #endif
  34104 
  34105 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_s32: calls __builtin_neon_vtrnq_v on two int32x4_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result int32x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 34 is presumably the type code for 128-bit int32 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34106 __ai __attribute__((target("neon"))) int32x4x2_t vtrnq_s32(int32x4_t __p0, int32x4_t __p1) {
  34107   int32x4x2_t __ret;
  34108   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34);
  34109   return __ret;
  34110 }
  34111 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34112 __ai __attribute__((target("neon"))) int32x4x2_t vtrnq_s32(int32x4_t __p0, int32x4_t __p1) {
  34113   int32x4x2_t __ret;
  34114   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34115   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34116   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  34117 
  34118   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34119   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34120   return __ret;
  34121 }
  34122 #endif
  34123 
  34124 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_s16: calls __builtin_neon_vtrnq_v on two int16x8_t vectors (cast
         * to int8x16_t). The builtin receives &__ret as its first argument, so
         * the two-vector result int16x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 33 is presumably the type code for 128-bit int16 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34125 __ai __attribute__((target("neon"))) int16x8x2_t vtrnq_s16(int16x8_t __p0, int16x8_t __p1) {
  34126   int16x8x2_t __ret;
  34127   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33);
  34128   return __ret;
  34129 }
  34130 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  34131 __ai __attribute__((target("neon"))) int16x8x2_t vtrnq_s16(int16x8_t __p0, int16x8_t __p1) {
  34132   int16x8x2_t __ret;
  34133   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34134   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34135   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  34136 
  34137   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34138   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34139   return __ret;
  34140 }
  34141 #endif
  34142 
  34143 #ifdef __LITTLE_ENDIAN__
        /* vtrn_u8: calls __builtin_neon_vtrn_v on two uint8x8_t vectors (cast to
         * int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result uint8x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 16 is presumably the element-type code (uint8) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34144 __ai __attribute__((target("neon"))) uint8x8x2_t vtrn_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34145   uint8x8x2_t __ret;
  34146   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16);
  34147   return __ret;
  34148 }
  34149 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  34150 __ai __attribute__((target("neon"))) uint8x8x2_t vtrn_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34151   uint8x8x2_t __ret;
  34152   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34153   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34154   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  34155 
  34156   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34157   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34158   return __ret;
  34159 }
  34160 #endif
  34161 
  34162 #ifdef __LITTLE_ENDIAN__
        /* vtrn_u32: calls __builtin_neon_vtrn_v on two uint32x2_t vectors (cast
         * to int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result uint32x2x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 18 is presumably the element-type code (uint32) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34163 __ai __attribute__((target("neon"))) uint32x2x2_t vtrn_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34164   uint32x2x2_t __ret;
  34165   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18);
  34166   return __ret;
  34167 }
  34168 #else
        /* Big-endian variant: both inputs have their two lanes swapped before
         * the call, then both result vectors are swapped back. */
  34169 __ai __attribute__((target("neon"))) uint32x2x2_t vtrn_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34170   uint32x2x2_t __ret;
  34171   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34172   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34173   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  34174 
  34175   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34176   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34177   return __ret;
  34178 }
  34179 #endif
  34180 
  34181 #ifdef __LITTLE_ENDIAN__
        /* vtrn_u16: calls __builtin_neon_vtrn_v on two uint16x4_t vectors (cast
         * to int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result uint16x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 17 is presumably the element-type code (uint16) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34182 __ai __attribute__((target("neon"))) uint16x4x2_t vtrn_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34183   uint16x4x2_t __ret;
  34184   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17);
  34185   return __ret;
  34186 }
  34187 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34188 __ai __attribute__((target("neon"))) uint16x4x2_t vtrn_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34189   uint16x4x2_t __ret;
  34190   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34191   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34192   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  34193 
  34194   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34195   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34196   return __ret;
  34197 }
  34198 #endif
  34199 
  34200 #ifdef __LITTLE_ENDIAN__
        /* vtrn_s8: calls __builtin_neon_vtrn_v on two int8x8_t vectors. The
         * builtin receives &__ret as its first argument, so the two-vector
         * result int8x8x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 0 is presumably the element-type code (int8) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34201 __ai __attribute__((target("neon"))) int8x8x2_t vtrn_s8(int8x8_t __p0, int8x8_t __p1) {
  34202   int8x8x2_t __ret;
  34203   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0);
  34204   return __ret;
  34205 }
  34206 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  34207 __ai __attribute__((target("neon"))) int8x8x2_t vtrn_s8(int8x8_t __p0, int8x8_t __p1) {
  34208   int8x8x2_t __ret;
  34209   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34210   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34211   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  34212 
  34213   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34214   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34215   return __ret;
  34216 }
  34217 #endif
  34218 
  34219 #ifdef __LITTLE_ENDIAN__
        /* vtrn_f32: calls __builtin_neon_vtrn_v on two float32x2_t vectors (cast
         * to int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result float32x2x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 9 is presumably the element-type code (float32) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34220 __ai __attribute__((target("neon"))) float32x2x2_t vtrn_f32(float32x2_t __p0, float32x2_t __p1) {
  34221   float32x2x2_t __ret;
  34222   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 9);
  34223   return __ret;
  34224 }
  34225 #else
        /* Big-endian variant: both inputs have their two lanes swapped before
         * the call, then both result vectors are swapped back. */
  34226 __ai __attribute__((target("neon"))) float32x2x2_t vtrn_f32(float32x2_t __p0, float32x2_t __p1) {
  34227   float32x2x2_t __ret;
  34228   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34229   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34230   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  34231 
  34232   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34233   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34234   return __ret;
  34235 }
  34236 #endif
  34237 
  34238 #ifdef __LITTLE_ENDIAN__
        /* vtrn_s32: calls __builtin_neon_vtrn_v on two int32x2_t vectors (cast to
         * int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result int32x2x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 2 is presumably the element-type code (int32) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34239 __ai __attribute__((target("neon"))) int32x2x2_t vtrn_s32(int32x2_t __p0, int32x2_t __p1) {
  34240   int32x2x2_t __ret;
  34241   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2);
  34242   return __ret;
  34243 }
  34244 #else
        /* Big-endian variant: both inputs have their two lanes swapped before
         * the call, then both result vectors are swapped back. */
  34245 __ai __attribute__((target("neon"))) int32x2x2_t vtrn_s32(int32x2_t __p0, int32x2_t __p1) {
  34246   int32x2x2_t __ret;
  34247   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34248   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34249   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  34250 
  34251   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34252   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34253   return __ret;
  34254 }
  34255 #endif
  34256 
  34257 #ifdef __LITTLE_ENDIAN__
        /* vtrn_s16: calls __builtin_neon_vtrn_v on two int16x4_t vectors (cast to
         * int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result int16x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 1 is presumably the element-type code (int16) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34258 __ai __attribute__((target("neon"))) int16x4x2_t vtrn_s16(int16x4_t __p0, int16x4_t __p1) {
  34259   int16x4x2_t __ret;
  34260   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1);
  34261   return __ret;
  34262 }
  34263 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34264 __ai __attribute__((target("neon"))) int16x4x2_t vtrn_s16(int16x4_t __p0, int16x4_t __p1) {
  34265   int16x4x2_t __ret;
  34266   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34267   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34268   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  34269 
  34270   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34271   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34272   return __ret;
  34273 }
  34274 #endif
  34275 
  34276 #ifdef __LITTLE_ENDIAN__
        /* vtrnq_f16: calls __builtin_neon_vtrnq_v on two float16x8_t vectors
         * (cast to int8x16_t). The builtin receives &__ret as its first argument,
         * so the two-vector result float16x8x2_t is filled in through that
         * pointer.
         * NOTE(review): by ACLE naming this is the 128-bit element transpose
         * (VTRN) -- confirm exact lane layout in the Arm reference.
         * The trailing 40 is presumably the type code for 128-bit float16 --
         * TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34277 __ai __attribute__((target("neon"))) float16x8x2_t vtrnq_f16(float16x8_t __p0, float16x8_t __p1) {
  34278   float16x8x2_t __ret;
  34279   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40);
  34280   return __ret;
  34281 }
  34282 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, then both result vectors are lane-reversed back. */
  34283 __ai __attribute__((target("neon"))) float16x8x2_t vtrnq_f16(float16x8_t __p0, float16x8_t __p1) {
  34284   float16x8x2_t __ret;
  34285   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34286   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34287   __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  34288 
  34289   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34290   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34291   return __ret;
  34292 }
  34293 #endif
  34294 
  34295 #ifdef __LITTLE_ENDIAN__
        /* vtrn_f16: calls __builtin_neon_vtrn_v on two float16x4_t vectors (cast
         * to int8x8_t). The builtin receives &__ret as its first argument, so the
         * two-vector result float16x4x2_t is filled in through that pointer.
         * NOTE(review): by ACLE naming this is the element transpose (VTRN) of
         * __p0 and __p1 -- confirm exact lane layout in the Arm reference.
         * The trailing 8 is presumably the element-type code (float16) -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34296 __ai __attribute__((target("neon"))) float16x4x2_t vtrn_f16(float16x4_t __p0, float16x4_t __p1) {
  34297   float16x4x2_t __ret;
  34298   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8);
  34299   return __ret;
  34300 }
  34301 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, then both result vectors are lane-reversed back. */
  34302 __ai __attribute__((target("neon"))) float16x4x2_t vtrn_f16(float16x4_t __p0, float16x4_t __p1) {
  34303   float16x4x2_t __ret;
  34304   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34305   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34306   __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  34307 
  34308   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34309   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34310   return __ret;
  34311 }
  34312 #endif
  34313 
  34314 #ifdef __LITTLE_ENDIAN__
        /* vtst_p8: returns __builtin_neon_vtst_v applied to two poly8x8_t vectors
         * (cast to int8x8_t), with the result cast to uint8x8_t.
         * NOTE(review): by ACLE naming this is the per-lane bit test (VTST) --
         * confirm the exact mask semantics in the Arm reference.
         * The trailing 16 is the same value vtst_u8 passes; presumably it is the
         * type code of the uint8 result rather than of the poly8 inputs -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34315 __ai __attribute__((target("neon"))) uint8x8_t vtst_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34316   uint8x8_t __ret;
  34317   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  34318   return __ret;
  34319 }
  34320 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, and the result is reversed back before returning. */
  34321 __ai __attribute__((target("neon"))) uint8x8_t vtst_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34322   uint8x8_t __ret;
  34323   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34324   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34325   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  34326   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34327   return __ret;
  34328 }
  34329 #endif
  34330 
  34331 #ifdef __LITTLE_ENDIAN__
        /* vtst_p16: returns __builtin_neon_vtst_v applied to two poly16x4_t
         * vectors (cast to int8x8_t), with the result cast to uint16x4_t.
         * NOTE(review): by ACLE naming this is the per-lane bit test (VTST) --
         * confirm the exact mask semantics in the Arm reference.
         * The trailing 17 is presumably the type code of the uint16 result
         * rather than of the poly16 inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34332 __ai __attribute__((target("neon"))) uint16x4_t vtst_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34333   uint16x4_t __ret;
  34334   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  34335   return __ret;
  34336 }
  34337 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, and the result is reversed back before returning. */
  34338 __ai __attribute__((target("neon"))) uint16x4_t vtst_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34339   uint16x4_t __ret;
  34340   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34341   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34342   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  34343   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  34344   return __ret;
  34345 }
  34346 #endif
  34347 
  34348 #ifdef __LITTLE_ENDIAN__
        /* vtstq_p8: returns __builtin_neon_vtstq_v applied to two poly8x16_t
         * vectors (cast to int8x16_t), with the result cast to uint8x16_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 48 is the same value vtstq_u8 passes; presumably it is
         * the type code of the 128-bit uint8 result rather than of the poly8
         * inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34349 __ai __attribute__((target("neon"))) uint8x16_t vtstq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  34350   uint8x16_t __ret;
  34351   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  34352   return __ret;
  34353 }
  34354 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, and the result is reversed back before returning. */
  34355 __ai __attribute__((target("neon"))) uint8x16_t vtstq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  34356   uint8x16_t __ret;
  34357   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34358   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34359   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  34360   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34361   return __ret;
  34362 }
  34363 #endif
  34364 
  34365 #ifdef __LITTLE_ENDIAN__
        /* vtstq_p16: returns __builtin_neon_vtstq_v applied to two poly16x8_t
         * vectors (cast to int8x16_t), with the result cast to uint16x8_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 49 is the same value vtstq_u16 passes; presumably it is
         * the type code of the 128-bit uint16 result rather than of the poly16
         * inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34366 __ai __attribute__((target("neon"))) uint16x8_t vtstq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  34367   uint16x8_t __ret;
  34368   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  34369   return __ret;
  34370 }
  34371 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, and the result is reversed back before returning. */
  34372 __ai __attribute__((target("neon"))) uint16x8_t vtstq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  34373   uint16x8_t __ret;
  34374   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34375   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34376   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  34377   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34378   return __ret;
  34379 }
  34380 #endif
  34381 
  34382 #ifdef __LITTLE_ENDIAN__
        /* vtstq_u8: returns __builtin_neon_vtstq_v applied to two uint8x16_t
         * vectors (cast to int8x16_t), with the result cast to uint8x16_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 48 is presumably the type code for 128-bit uint8 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34383 __ai __attribute__((target("neon"))) uint8x16_t vtstq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34384   uint8x16_t __ret;
  34385   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  34386   return __ret;
  34387 }
  34388 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, and the result is reversed back before returning. */
  34389 __ai __attribute__((target("neon"))) uint8x16_t vtstq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34390   uint8x16_t __ret;
  34391   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34392   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34393   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  34394   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34395   return __ret;
  34396 }
  34397 #endif
  34398 
  34399 #ifdef __LITTLE_ENDIAN__
        /* vtstq_u32: returns __builtin_neon_vtstq_v applied to two uint32x4_t
         * vectors (cast to int8x16_t), with the result cast to uint32x4_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 50 is presumably the type code for 128-bit uint32 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34400 __ai __attribute__((target("neon"))) uint32x4_t vtstq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34401   uint32x4_t __ret;
  34402   __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  34403   return __ret;
  34404 }
  34405 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, and the result is reversed back before returning. */
  34406 __ai __attribute__((target("neon"))) uint32x4_t vtstq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34407   uint32x4_t __ret;
  34408   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34409   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34410   __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  34411   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  34412   return __ret;
  34413 }
  34414 #endif
  34415 
  34416 #ifdef __LITTLE_ENDIAN__
        /* vtstq_u16: returns __builtin_neon_vtstq_v applied to two uint16x8_t
         * vectors (cast to int8x16_t), with the result cast to uint16x8_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 49 is presumably the type code for 128-bit uint16 -- TODO
         * confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34417 __ai __attribute__((target("neon"))) uint16x8_t vtstq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34418   uint16x8_t __ret;
  34419   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  34420   return __ret;
  34421 }
  34422 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, and the result is reversed back before returning. */
  34423 __ai __attribute__((target("neon"))) uint16x8_t vtstq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34424   uint16x8_t __ret;
  34425   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34426   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34427   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  34428   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34429   return __ret;
  34430 }
  34431 #endif
  34432 
  34433 #ifdef __LITTLE_ENDIAN__
        /* vtstq_s8: returns __builtin_neon_vtstq_v applied to two int8x16_t
         * vectors, with the result cast to uint8x16_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 48 is the same value vtstq_u8 passes; presumably it is
         * the type code of the 128-bit uint8 result rather than of the signed
         * inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34434 __ai __attribute__((target("neon"))) uint8x16_t vtstq_s8(int8x16_t __p0, int8x16_t __p1) {
  34435   uint8x16_t __ret;
  34436   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  34437   return __ret;
  34438 }
  34439 #else
        /* Big-endian variant: both inputs are lane-reversed (15..0) before the
         * call, and the result is reversed back before returning. */
  34440 __ai __attribute__((target("neon"))) uint8x16_t vtstq_s8(int8x16_t __p0, int8x16_t __p1) {
  34441   uint8x16_t __ret;
  34442   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34443   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34444   __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  34445   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34446   return __ret;
  34447 }
  34448 #endif
  34449 
  34450 #ifdef __LITTLE_ENDIAN__
        /* vtstq_s32: returns __builtin_neon_vtstq_v applied to two int32x4_t
         * vectors (cast to int8x16_t), with the result cast to uint32x4_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 50 is the same value vtstq_u32 passes; presumably it is
         * the type code of the 128-bit uint32 result rather than of the signed
         * inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34451 __ai __attribute__((target("neon"))) uint32x4_t vtstq_s32(int32x4_t __p0, int32x4_t __p1) {
  34452   uint32x4_t __ret;
  34453   __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  34454   return __ret;
  34455 }
  34456 #else
        /* Big-endian variant: both inputs are lane-reversed (3..0) before the
         * call, and the result is reversed back before returning. */
  34457 __ai __attribute__((target("neon"))) uint32x4_t vtstq_s32(int32x4_t __p0, int32x4_t __p1) {
  34458   uint32x4_t __ret;
  34459   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34460   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34461   __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  34462   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  34463   return __ret;
  34464 }
  34465 #endif
  34466 
  34467 #ifdef __LITTLE_ENDIAN__
        /* vtstq_s16: returns __builtin_neon_vtstq_v applied to two int16x8_t
         * vectors (cast to int8x16_t), with the result cast to uint16x8_t.
         * NOTE(review): by ACLE naming this is the 128-bit per-lane bit test
         * (VTST) -- confirm the exact mask semantics in the Arm reference.
         * The trailing 49 is the same value vtstq_u16 passes; presumably it is
         * the type code of the 128-bit uint16 result rather than of the signed
         * inputs -- TODO confirm against clang.
         * Little-endian variant: inputs are forwarded unchanged. */
  34468 __ai __attribute__((target("neon"))) uint16x8_t vtstq_s16(int16x8_t __p0, int16x8_t __p1) {
  34469   uint16x8_t __ret;
  34470   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  34471   return __ret;
  34472 }
  34473 #else
        /* Big-endian variant: both inputs are lane-reversed (7..0) before the
         * call, and the result is reversed back before returning. */
  34474 __ai __attribute__((target("neon"))) uint16x8_t vtstq_s16(int16x8_t __p0, int16x8_t __p1) {
  34475   uint16x8_t __ret;
  34476   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34477   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34478   __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  34479   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34480   return __ret;
  34481 }
  34482 #endif
  34483 
  34484 #ifdef __LITTLE_ENDIAN__
  34485 __ai __attribute__((target("neon"))) uint8x8_t vtst_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34486   uint8x8_t __ret;
  34487   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  34488   return __ret;
  34489 }
  34490 #else
  34491 __ai __attribute__((target("neon"))) uint8x8_t vtst_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34492   uint8x8_t __ret;
  34493   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34494   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34495   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  34496   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34497   return __ret;
  34498 }
  34499 #endif
  34500 
  34501 #ifdef __LITTLE_ENDIAN__
  34502 __ai __attribute__((target("neon"))) uint32x2_t vtst_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34503   uint32x2_t __ret;
  34504   __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  34505   return __ret;
  34506 }
  34507 #else
  34508 __ai __attribute__((target("neon"))) uint32x2_t vtst_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34509   uint32x2_t __ret;
  34510   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34511   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34512   __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  34513   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  34514   return __ret;
  34515 }
  34516 #endif
  34517 
  34518 #ifdef __LITTLE_ENDIAN__
  34519 __ai __attribute__((target("neon"))) uint16x4_t vtst_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34520   uint16x4_t __ret;
  34521   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  34522   return __ret;
  34523 }
  34524 #else
  34525 __ai __attribute__((target("neon"))) uint16x4_t vtst_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34526   uint16x4_t __ret;
  34527   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34528   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34529   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  34530   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  34531   return __ret;
  34532 }
  34533 #endif
  34534 
  34535 #ifdef __LITTLE_ENDIAN__
  34536 __ai __attribute__((target("neon"))) uint8x8_t vtst_s8(int8x8_t __p0, int8x8_t __p1) {
  34537   uint8x8_t __ret;
  34538   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  34539   return __ret;
  34540 }
  34541 #else
  34542 __ai __attribute__((target("neon"))) uint8x8_t vtst_s8(int8x8_t __p0, int8x8_t __p1) {
  34543   uint8x8_t __ret;
  34544   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34545   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34546   __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  34547   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  34548   return __ret;
  34549 }
  34550 #endif
  34551 
  34552 #ifdef __LITTLE_ENDIAN__
  34553 __ai __attribute__((target("neon"))) uint32x2_t vtst_s32(int32x2_t __p0, int32x2_t __p1) {
  34554   uint32x2_t __ret;
  34555   __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  34556   return __ret;
  34557 }
  34558 #else
  34559 __ai __attribute__((target("neon"))) uint32x2_t vtst_s32(int32x2_t __p0, int32x2_t __p1) {
  34560   uint32x2_t __ret;
  34561   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34562   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34563   __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  34564   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  34565   return __ret;
  34566 }
  34567 #endif
  34568 
  34569 #ifdef __LITTLE_ENDIAN__
  34570 __ai __attribute__((target("neon"))) uint16x4_t vtst_s16(int16x4_t __p0, int16x4_t __p1) {
  34571   uint16x4_t __ret;
  34572   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  34573   return __ret;
  34574 }
  34575 #else
  34576 __ai __attribute__((target("neon"))) uint16x4_t vtst_s16(int16x4_t __p0, int16x4_t __p1) {
  34577   uint16x4_t __ret;
  34578   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34579   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34580   __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  34581   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  34582   return __ret;
  34583 }
  34584 #endif
  34585 
  34586 #ifdef __LITTLE_ENDIAN__
  34587 __ai __attribute__((target("neon"))) poly8x8x2_t vuzp_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34588   poly8x8x2_t __ret;
  34589   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4);
  34590   return __ret;
  34591 }
  34592 #else
  34593 __ai __attribute__((target("neon"))) poly8x8x2_t vuzp_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34594   poly8x8x2_t __ret;
  34595   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34596   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34597   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4);
  34598 
  34599   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34600   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34601   return __ret;
  34602 }
  34603 #endif
  34604 
  34605 #ifdef __LITTLE_ENDIAN__
  34606 __ai __attribute__((target("neon"))) poly16x4x2_t vuzp_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34607   poly16x4x2_t __ret;
  34608   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5);
  34609   return __ret;
  34610 }
  34611 #else
  34612 __ai __attribute__((target("neon"))) poly16x4x2_t vuzp_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34613   poly16x4x2_t __ret;
  34614   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34615   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34616   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5);
  34617 
  34618   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34619   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34620   return __ret;
  34621 }
  34622 #endif
  34623 
  34624 #ifdef __LITTLE_ENDIAN__
  34625 __ai __attribute__((target("neon"))) poly8x16x2_t vuzpq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  34626   poly8x16x2_t __ret;
  34627   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 36);
  34628   return __ret;
  34629 }
  34630 #else
  34631 __ai __attribute__((target("neon"))) poly8x16x2_t vuzpq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  34632   poly8x16x2_t __ret;
  34633   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34634   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34635   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36);
  34636 
  34637   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34638   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34639   return __ret;
  34640 }
  34641 #endif
  34642 
  34643 #ifdef __LITTLE_ENDIAN__
  34644 __ai __attribute__((target("neon"))) poly16x8x2_t vuzpq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  34645   poly16x8x2_t __ret;
  34646   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37);
  34647   return __ret;
  34648 }
  34649 #else
  34650 __ai __attribute__((target("neon"))) poly16x8x2_t vuzpq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  34651   poly16x8x2_t __ret;
  34652   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34653   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34654   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37);
  34655 
  34656   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34657   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34658   return __ret;
  34659 }
  34660 #endif
  34661 
  34662 #ifdef __LITTLE_ENDIAN__
  34663 __ai __attribute__((target("neon"))) uint8x16x2_t vuzpq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34664   uint8x16x2_t __ret;
  34665   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48);
  34666   return __ret;
  34667 }
  34668 #else
  34669 __ai __attribute__((target("neon"))) uint8x16x2_t vuzpq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  34670   uint8x16x2_t __ret;
  34671   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34672   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34673   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  34674 
  34675   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34676   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34677   return __ret;
  34678 }
  34679 #endif
  34680 
  34681 #ifdef __LITTLE_ENDIAN__
  34682 __ai __attribute__((target("neon"))) uint32x4x2_t vuzpq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34683   uint32x4x2_t __ret;
  34684   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50);
  34685   return __ret;
  34686 }
  34687 #else
  34688 __ai __attribute__((target("neon"))) uint32x4x2_t vuzpq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  34689   uint32x4x2_t __ret;
  34690   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34691   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34692   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  34693 
  34694   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34695   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34696   return __ret;
  34697 }
  34698 #endif
  34699 
  34700 #ifdef __LITTLE_ENDIAN__
  34701 __ai __attribute__((target("neon"))) uint16x8x2_t vuzpq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34702   uint16x8x2_t __ret;
  34703   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49);
  34704   return __ret;
  34705 }
  34706 #else
  34707 __ai __attribute__((target("neon"))) uint16x8x2_t vuzpq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  34708   uint16x8x2_t __ret;
  34709   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34710   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34711   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  34712 
  34713   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34714   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34715   return __ret;
  34716 }
  34717 #endif
  34718 
  34719 #ifdef __LITTLE_ENDIAN__
  34720 __ai __attribute__((target("neon"))) int8x16x2_t vuzpq_s8(int8x16_t __p0, int8x16_t __p1) {
  34721   int8x16x2_t __ret;
  34722   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 32);
  34723   return __ret;
  34724 }
  34725 #else
  34726 __ai __attribute__((target("neon"))) int8x16x2_t vuzpq_s8(int8x16_t __p0, int8x16_t __p1) {
  34727   int8x16x2_t __ret;
  34728   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34729   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34730   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  34731 
  34732   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34733   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  34734   return __ret;
  34735 }
  34736 #endif
  34737 
  34738 #ifdef __LITTLE_ENDIAN__
  34739 __ai __attribute__((target("neon"))) float32x4x2_t vuzpq_f32(float32x4_t __p0, float32x4_t __p1) {
  34740   float32x4x2_t __ret;
  34741   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41);
  34742   return __ret;
  34743 }
  34744 #else
  34745 __ai __attribute__((target("neon"))) float32x4x2_t vuzpq_f32(float32x4_t __p0, float32x4_t __p1) {
  34746   float32x4x2_t __ret;
  34747   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34748   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34749   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  34750 
  34751   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34752   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34753   return __ret;
  34754 }
  34755 #endif
  34756 
  34757 #ifdef __LITTLE_ENDIAN__
  34758 __ai __attribute__((target("neon"))) int32x4x2_t vuzpq_s32(int32x4_t __p0, int32x4_t __p1) {
  34759   int32x4x2_t __ret;
  34760   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34);
  34761   return __ret;
  34762 }
  34763 #else
  34764 __ai __attribute__((target("neon"))) int32x4x2_t vuzpq_s32(int32x4_t __p0, int32x4_t __p1) {
  34765   int32x4x2_t __ret;
  34766   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34767   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34768   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  34769 
  34770   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34771   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34772   return __ret;
  34773 }
  34774 #endif
  34775 
  34776 #ifdef __LITTLE_ENDIAN__
  34777 __ai __attribute__((target("neon"))) int16x8x2_t vuzpq_s16(int16x8_t __p0, int16x8_t __p1) {
  34778   int16x8x2_t __ret;
  34779   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33);
  34780   return __ret;
  34781 }
  34782 #else
  34783 __ai __attribute__((target("neon"))) int16x8x2_t vuzpq_s16(int16x8_t __p0, int16x8_t __p1) {
  34784   int16x8x2_t __ret;
  34785   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34786   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34787   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  34788 
  34789   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34790   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34791   return __ret;
  34792 }
  34793 #endif
  34794 
  34795 #ifdef __LITTLE_ENDIAN__
  34796 __ai __attribute__((target("neon"))) uint8x8x2_t vuzp_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34797   uint8x8x2_t __ret;
  34798   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16);
  34799   return __ret;
  34800 }
  34801 #else
  34802 __ai __attribute__((target("neon"))) uint8x8x2_t vuzp_u8(uint8x8_t __p0, uint8x8_t __p1) {
  34803   uint8x8x2_t __ret;
  34804   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34805   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34806   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  34807 
  34808   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34809   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34810   return __ret;
  34811 }
  34812 #endif
  34813 
  34814 #ifdef __LITTLE_ENDIAN__
  34815 __ai __attribute__((target("neon"))) uint32x2x2_t vuzp_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34816   uint32x2x2_t __ret;
  34817   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18);
  34818   return __ret;
  34819 }
  34820 #else
  34821 __ai __attribute__((target("neon"))) uint32x2x2_t vuzp_u32(uint32x2_t __p0, uint32x2_t __p1) {
  34822   uint32x2x2_t __ret;
  34823   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34824   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34825   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  34826 
  34827   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34828   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34829   return __ret;
  34830 }
  34831 #endif
  34832 
  34833 #ifdef __LITTLE_ENDIAN__
  34834 __ai __attribute__((target("neon"))) uint16x4x2_t vuzp_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34835   uint16x4x2_t __ret;
  34836   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17);
  34837   return __ret;
  34838 }
  34839 #else
  34840 __ai __attribute__((target("neon"))) uint16x4x2_t vuzp_u16(uint16x4_t __p0, uint16x4_t __p1) {
  34841   uint16x4x2_t __ret;
  34842   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34843   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34844   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  34845 
  34846   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34847   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34848   return __ret;
  34849 }
  34850 #endif
  34851 
  34852 #ifdef __LITTLE_ENDIAN__
  34853 __ai __attribute__((target("neon"))) int8x8x2_t vuzp_s8(int8x8_t __p0, int8x8_t __p1) {
  34854   int8x8x2_t __ret;
  34855   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0);
  34856   return __ret;
  34857 }
  34858 #else
  34859 __ai __attribute__((target("neon"))) int8x8x2_t vuzp_s8(int8x8_t __p0, int8x8_t __p1) {
  34860   int8x8x2_t __ret;
  34861   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34862   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34863   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  34864 
  34865   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34866   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34867   return __ret;
  34868 }
  34869 #endif
  34870 
  34871 #ifdef __LITTLE_ENDIAN__
  34872 __ai __attribute__((target("neon"))) float32x2x2_t vuzp_f32(float32x2_t __p0, float32x2_t __p1) {
  34873   float32x2x2_t __ret;
  34874   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 9);
  34875   return __ret;
  34876 }
  34877 #else
  34878 __ai __attribute__((target("neon"))) float32x2x2_t vuzp_f32(float32x2_t __p0, float32x2_t __p1) {
  34879   float32x2x2_t __ret;
  34880   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34881   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34882   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  34883 
  34884   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34885   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34886   return __ret;
  34887 }
  34888 #endif
  34889 
  34890 #ifdef __LITTLE_ENDIAN__
  34891 __ai __attribute__((target("neon"))) int32x2x2_t vuzp_s32(int32x2_t __p0, int32x2_t __p1) {
  34892   int32x2x2_t __ret;
  34893   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2);
  34894   return __ret;
  34895 }
  34896 #else
  34897 __ai __attribute__((target("neon"))) int32x2x2_t vuzp_s32(int32x2_t __p0, int32x2_t __p1) {
  34898   int32x2x2_t __ret;
  34899   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  34900   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  34901   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  34902 
  34903   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  34904   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  34905   return __ret;
  34906 }
  34907 #endif
  34908 
  34909 #ifdef __LITTLE_ENDIAN__
  34910 __ai __attribute__((target("neon"))) int16x4x2_t vuzp_s16(int16x4_t __p0, int16x4_t __p1) {
  34911   int16x4x2_t __ret;
  34912   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1);
  34913   return __ret;
  34914 }
  34915 #else
  34916 __ai __attribute__((target("neon"))) int16x4x2_t vuzp_s16(int16x4_t __p0, int16x4_t __p1) {
  34917   int16x4x2_t __ret;
  34918   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34919   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34920   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  34921 
  34922   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34923   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34924   return __ret;
  34925 }
  34926 #endif
  34927 
  34928 #ifdef __LITTLE_ENDIAN__
  34929 __ai __attribute__((target("neon"))) float16x8x2_t vuzpq_f16(float16x8_t __p0, float16x8_t __p1) {
  34930   float16x8x2_t __ret;
  34931   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40);
  34932   return __ret;
  34933 }
  34934 #else
  34935 __ai __attribute__((target("neon"))) float16x8x2_t vuzpq_f16(float16x8_t __p0, float16x8_t __p1) {
  34936   float16x8x2_t __ret;
  34937   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34938   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34939   __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  34940 
  34941   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34942   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34943   return __ret;
  34944 }
  34945 #endif
  34946 
  34947 #ifdef __LITTLE_ENDIAN__
  34948 __ai __attribute__((target("neon"))) float16x4x2_t vuzp_f16(float16x4_t __p0, float16x4_t __p1) {
  34949   float16x4x2_t __ret;
  34950   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8);
  34951   return __ret;
  34952 }
  34953 #else
  34954 __ai __attribute__((target("neon"))) float16x4x2_t vuzp_f16(float16x4_t __p0, float16x4_t __p1) {
  34955   float16x4x2_t __ret;
  34956   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34957   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34958   __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  34959 
  34960   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34961   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  34962   return __ret;
  34963 }
  34964 #endif
  34965 
  34966 #ifdef __LITTLE_ENDIAN__
  34967 __ai __attribute__((target("neon"))) poly8x8x2_t vzip_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34968   poly8x8x2_t __ret;
  34969   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4);
  34970   return __ret;
  34971 }
  34972 #else
  34973 __ai __attribute__((target("neon"))) poly8x8x2_t vzip_p8(poly8x8_t __p0, poly8x8_t __p1) {
  34974   poly8x8x2_t __ret;
  34975   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  34976   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  34977   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4);
  34978 
  34979   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  34980   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  34981   return __ret;
  34982 }
  34983 #endif
  34984 
  34985 #ifdef __LITTLE_ENDIAN__
  34986 __ai __attribute__((target("neon"))) poly16x4x2_t vzip_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34987   poly16x4x2_t __ret;
  34988   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5);
  34989   return __ret;
  34990 }
  34991 #else
  34992 __ai __attribute__((target("neon"))) poly16x4x2_t vzip_p16(poly16x4_t __p0, poly16x4_t __p1) {
  34993   poly16x4x2_t __ret;
  34994   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  34995   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  34996   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5);
  34997 
  34998   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  34999   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35000   return __ret;
  35001 }
  35002 #endif
  35003 
  35004 #ifdef __LITTLE_ENDIAN__
  35005 __ai __attribute__((target("neon"))) poly8x16x2_t vzipq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  35006   poly8x16x2_t __ret;
  35007   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 36);
  35008   return __ret;
  35009 }
  35010 #else
  35011 __ai __attribute__((target("neon"))) poly8x16x2_t vzipq_p8(poly8x16_t __p0, poly8x16_t __p1) {
  35012   poly8x16x2_t __ret;
  35013   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35014   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35015   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36);
  35016 
  35017   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35018   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35019   return __ret;
  35020 }
  35021 #endif
  35022 
  35023 #ifdef __LITTLE_ENDIAN__
  35024 __ai __attribute__((target("neon"))) poly16x8x2_t vzipq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  35025   poly16x8x2_t __ret;
  35026   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37);
  35027   return __ret;
  35028 }
  35029 #else
  35030 __ai __attribute__((target("neon"))) poly16x8x2_t vzipq_p16(poly16x8_t __p0, poly16x8_t __p1) {
  35031   poly16x8x2_t __ret;
  35032   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35033   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35034   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37);
  35035 
  35036   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35037   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35038   return __ret;
  35039 }
  35040 #endif
  35041 
  35042 #ifdef __LITTLE_ENDIAN__
  35043 __ai __attribute__((target("neon"))) uint8x16x2_t vzipq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  35044   uint8x16x2_t __ret;
  35045   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48);
  35046   return __ret;
  35047 }
  35048 #else
  35049 __ai __attribute__((target("neon"))) uint8x16x2_t vzipq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  35050   uint8x16x2_t __ret;
  35051   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35052   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35053   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  35054 
  35055   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35056   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35057   return __ret;
  35058 }
  35059 #endif
  35060 
  35061 #ifdef __LITTLE_ENDIAN__
  35062 __ai __attribute__((target("neon"))) uint32x4x2_t vzipq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  35063   uint32x4x2_t __ret;
  35064   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50);
  35065   return __ret;
  35066 }
  35067 #else
  35068 __ai __attribute__((target("neon"))) uint32x4x2_t vzipq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  35069   uint32x4x2_t __ret;
  35070   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35071   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35072   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  35073 
  35074   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35075   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35076   return __ret;
  35077 }
  35078 #endif
  35079 
  35080 #ifdef __LITTLE_ENDIAN__
  35081 __ai __attribute__((target("neon"))) uint16x8x2_t vzipq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  35082   uint16x8x2_t __ret;
  35083   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49);
  35084   return __ret;
  35085 }
  35086 #else
  35087 __ai __attribute__((target("neon"))) uint16x8x2_t vzipq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  35088   uint16x8x2_t __ret;
  35089   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35090   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35091   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  35092 
  35093   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35094   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35095   return __ret;
  35096 }
  35097 #endif
  35098 
  35099 #ifdef __LITTLE_ENDIAN__
  35100 __ai __attribute__((target("neon"))) int8x16x2_t vzipq_s8(int8x16_t __p0, int8x16_t __p1) {
  35101   int8x16x2_t __ret;
  35102   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 32);
  35103   return __ret;
  35104 }
  35105 #else
  35106 __ai __attribute__((target("neon"))) int8x16x2_t vzipq_s8(int8x16_t __p0, int8x16_t __p1) {
  35107   int8x16x2_t __ret;
  35108   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35109   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35110   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  35111 
  35112   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35113   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  35114   return __ret;
  35115 }
  35116 #endif
  35117 
  35118 #ifdef __LITTLE_ENDIAN__
  35119 __ai __attribute__((target("neon"))) float32x4x2_t vzipq_f32(float32x4_t __p0, float32x4_t __p1) {
  35120   float32x4x2_t __ret;
  35121   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41);
  35122   return __ret;
  35123 }
  35124 #else
  35125 __ai __attribute__((target("neon"))) float32x4x2_t vzipq_f32(float32x4_t __p0, float32x4_t __p1) {
  35126   float32x4x2_t __ret;
  35127   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35128   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35129   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  35130 
  35131   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35132   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35133   return __ret;
  35134 }
  35135 #endif
  35136 
  35137 #ifdef __LITTLE_ENDIAN__
  35138 __ai __attribute__((target("neon"))) int32x4x2_t vzipq_s32(int32x4_t __p0, int32x4_t __p1) {
  35139   int32x4x2_t __ret;
  35140   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34);
  35141   return __ret;
  35142 }
  35143 #else
  35144 __ai __attribute__((target("neon"))) int32x4x2_t vzipq_s32(int32x4_t __p0, int32x4_t __p1) {
  35145   int32x4x2_t __ret;
  35146   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35147   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35148   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  35149 
  35150   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35151   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35152   return __ret;
  35153 }
  35154 #endif
  35155 
  35156 #ifdef __LITTLE_ENDIAN__
  35157 __ai __attribute__((target("neon"))) int16x8x2_t vzipq_s16(int16x8_t __p0, int16x8_t __p1) {
  35158   int16x8x2_t __ret;
  35159   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33);
  35160   return __ret;
  35161 }
  35162 #else
  35163 __ai __attribute__((target("neon"))) int16x8x2_t vzipq_s16(int16x8_t __p0, int16x8_t __p1) {
  35164   int16x8x2_t __ret;
  35165   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35166   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35167   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  35168 
  35169   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35170   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35171   return __ret;
  35172 }
  35173 #endif
  35174 
  35175 #ifdef __LITTLE_ENDIAN__
  35176 __ai __attribute__((target("neon"))) uint8x8x2_t vzip_u8(uint8x8_t __p0, uint8x8_t __p1) {
  35177   uint8x8x2_t __ret;
  35178   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16);
  35179   return __ret;
  35180 }
  35181 #else
  35182 __ai __attribute__((target("neon"))) uint8x8x2_t vzip_u8(uint8x8_t __p0, uint8x8_t __p1) {
  35183   uint8x8x2_t __ret;
  35184   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35185   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35186   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  35187 
  35188   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35189   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35190   return __ret;
  35191 }
  35192 #endif
  35193 
  35194 #ifdef __LITTLE_ENDIAN__
  35195 __ai __attribute__((target("neon"))) uint32x2x2_t vzip_u32(uint32x2_t __p0, uint32x2_t __p1) {
  35196   uint32x2x2_t __ret;
  35197   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18);
  35198   return __ret;
  35199 }
  35200 #else
  35201 __ai __attribute__((target("neon"))) uint32x2x2_t vzip_u32(uint32x2_t __p0, uint32x2_t __p1) {
  35202   uint32x2x2_t __ret;
  35203   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  35204   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  35205   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  35206 
  35207   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  35208   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  35209   return __ret;
  35210 }
  35211 #endif
  35212 
  35213 #ifdef __LITTLE_ENDIAN__
  35214 __ai __attribute__((target("neon"))) uint16x4x2_t vzip_u16(uint16x4_t __p0, uint16x4_t __p1) {
  35215   uint16x4x2_t __ret;
  35216   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17);
  35217   return __ret;
  35218 }
  35219 #else
  35220 __ai __attribute__((target("neon"))) uint16x4x2_t vzip_u16(uint16x4_t __p0, uint16x4_t __p1) {
  35221   uint16x4x2_t __ret;
  35222   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35223   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35224   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  35225 
  35226   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35227   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35228   return __ret;
  35229 }
  35230 #endif
  35231 
  35232 #ifdef __LITTLE_ENDIAN__
  35233 __ai __attribute__((target("neon"))) int8x8x2_t vzip_s8(int8x8_t __p0, int8x8_t __p1) {
  35234   int8x8x2_t __ret;
  35235   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0);
  35236   return __ret;
  35237 }
  35238 #else
  35239 __ai __attribute__((target("neon"))) int8x8x2_t vzip_s8(int8x8_t __p0, int8x8_t __p1) {
  35240   int8x8x2_t __ret;
  35241   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35242   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35243   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  35244 
  35245   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35246   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35247   return __ret;
  35248 }
  35249 #endif
  35250 
  35251 #ifdef __LITTLE_ENDIAN__
  35252 __ai __attribute__((target("neon"))) float32x2x2_t vzip_f32(float32x2_t __p0, float32x2_t __p1) {
  35253   float32x2x2_t __ret;
  35254   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 9);
  35255   return __ret;
  35256 }
  35257 #else
  35258 __ai __attribute__((target("neon"))) float32x2x2_t vzip_f32(float32x2_t __p0, float32x2_t __p1) {
  35259   float32x2x2_t __ret;
  35260   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  35261   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  35262   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  35263 
  35264   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  35265   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  35266   return __ret;
  35267 }
  35268 #endif
  35269 
  35270 #ifdef __LITTLE_ENDIAN__
  35271 __ai __attribute__((target("neon"))) int32x2x2_t vzip_s32(int32x2_t __p0, int32x2_t __p1) {
  35272   int32x2x2_t __ret;
  35273   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2);
  35274   return __ret;
  35275 }
  35276 #else
  35277 __ai __attribute__((target("neon"))) int32x2x2_t vzip_s32(int32x2_t __p0, int32x2_t __p1) {
  35278   int32x2x2_t __ret;
  35279   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  35280   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  35281   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  35282 
  35283   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0);
  35284   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0);
  35285   return __ret;
  35286 }
  35287 #endif
  35288 
  35289 #ifdef __LITTLE_ENDIAN__
  35290 __ai __attribute__((target("neon"))) int16x4x2_t vzip_s16(int16x4_t __p0, int16x4_t __p1) {
  35291   int16x4x2_t __ret;
  35292   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1);
  35293   return __ret;
  35294 }
  35295 #else
  35296 __ai __attribute__((target("neon"))) int16x4x2_t vzip_s16(int16x4_t __p0, int16x4_t __p1) {
  35297   int16x4x2_t __ret;
  35298   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35299   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35300   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  35301 
  35302   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35303   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35304   return __ret;
  35305 }
  35306 #endif
  35307 
  35308 #ifdef __LITTLE_ENDIAN__
  35309 __ai __attribute__((target("neon"))) float16x8x2_t vzipq_f16(float16x8_t __p0, float16x8_t __p1) {
  35310   float16x8x2_t __ret;
  35311   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40);
  35312   return __ret;
  35313 }
  35314 #else
  35315 __ai __attribute__((target("neon"))) float16x8x2_t vzipq_f16(float16x8_t __p0, float16x8_t __p1) {
  35316   float16x8x2_t __ret;
  35317   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35318   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35319   __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  35320 
  35321   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0);
  35322   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0);
  35323   return __ret;
  35324 }
  35325 #endif
  35326 
  35327 #ifdef __LITTLE_ENDIAN__
  35328 __ai __attribute__((target("neon"))) float16x4x2_t vzip_f16(float16x4_t __p0, float16x4_t __p1) {
  35329   float16x4x2_t __ret;
  35330   __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8);
  35331   return __ret;
  35332 }
  35333 #else
  35334 __ai __attribute__((target("neon"))) float16x4x2_t vzip_f16(float16x4_t __p0, float16x4_t __p1) {
  35335   float16x4x2_t __ret;
  35336   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35337   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35338   __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  35339 
  35340   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0);
  35341   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0);
  35342   return __ret;
  35343 }
  35344 #endif
  35345 
  35346 #ifdef __LITTLE_ENDIAN__
  35347 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35348   int32x4_t __ret;
  35349   __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  35350   return __ret;
  35351 }
  35352 #else
  35353 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35354   int32x4_t __ret;
  35355   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35356   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35357   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35358   __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
  35359   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35360   return __ret;
  35361 }
  35362 __ai __attribute__((target("v8.1a,neon"))) int32x4_t __noswap_vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35363   int32x4_t __ret;
  35364   __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  35365   return __ret;
  35366 }
  35367 #endif
  35368 
  35369 #ifdef __LITTLE_ENDIAN__
  35370 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35371   int16x8_t __ret;
  35372   __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  35373   return __ret;
  35374 }
  35375 #else
  35376 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35377   int16x8_t __ret;
  35378   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35379   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35380   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  35381   __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33);
  35382   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35383   return __ret;
  35384 }
  35385 __ai __attribute__((target("v8.1a,neon"))) int16x8_t __noswap_vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35386   int16x8_t __ret;
  35387   __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  35388   return __ret;
  35389 }
  35390 #endif
  35391 
  35392 #ifdef __LITTLE_ENDIAN__
  35393 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35394   int32x2_t __ret;
  35395   __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
  35396   return __ret;
  35397 }
  35398 #else
  35399 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35400   int32x2_t __ret;
  35401   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  35402   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  35403   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  35404   __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2);
  35405   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  35406   return __ret;
  35407 }
  35408 __ai __attribute__((target("v8.1a,neon"))) int32x2_t __noswap_vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35409   int32x2_t __ret;
  35410   __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
  35411   return __ret;
  35412 }
  35413 #endif
  35414 
  35415 #ifdef __LITTLE_ENDIAN__
  35416 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35417   int16x4_t __ret;
  35418   __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1);
  35419   return __ret;
  35420 }
  35421 #else
  35422 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35423   int16x4_t __ret;
  35424   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35425   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35426   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35427   __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1);
  35428   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35429   return __ret;
  35430 }
  35431 __ai __attribute__((target("v8.1a,neon"))) int16x4_t __noswap_vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35432   int16x4_t __ret;
  35433   __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1);
  35434   return __ret;
  35435 }
  35436 #endif
  35437 
  35438 #ifdef __LITTLE_ENDIAN__
  35439 #define vqrdmlahq_lane_s32(__p0_134, __p1_134, __p2_134, __p3_134) __extension__ ({ \
  35440   int32x4_t __ret_134; \
  35441   int32x4_t __s0_134 = __p0_134; \
  35442   int32x4_t __s1_134 = __p1_134; \
  35443   int32x2_t __s2_134 = __p2_134; \
  35444   __ret_134 = vqrdmlahq_s32(__s0_134, __s1_134, splatq_lane_s32(__s2_134, __p3_134)); \
  35445   __ret_134; \
  35446 })
  35447 #else
  35448 #define vqrdmlahq_lane_s32(__p0_135, __p1_135, __p2_135, __p3_135) __extension__ ({ \
  35449   int32x4_t __ret_135; \
  35450   int32x4_t __s0_135 = __p0_135; \
  35451   int32x4_t __s1_135 = __p1_135; \
  35452   int32x2_t __s2_135 = __p2_135; \
  35453   int32x4_t __rev0_135;  __rev0_135 = __builtin_shufflevector(__s0_135, __s0_135, 3, 2, 1, 0); \
  35454   int32x4_t __rev1_135;  __rev1_135 = __builtin_shufflevector(__s1_135, __s1_135, 3, 2, 1, 0); \
  35455   int32x2_t __rev2_135;  __rev2_135 = __builtin_shufflevector(__s2_135, __s2_135, 1, 0); \
  35456   __ret_135 = __noswap_vqrdmlahq_s32(__rev0_135, __rev1_135, __noswap_splatq_lane_s32(__rev2_135, __p3_135)); \
  35457   __ret_135 = __builtin_shufflevector(__ret_135, __ret_135, 3, 2, 1, 0); \
  35458   __ret_135; \
  35459 })
  35460 #endif
  35461 
  35462 #ifdef __LITTLE_ENDIAN__
  35463 #define vqrdmlahq_lane_s16(__p0_136, __p1_136, __p2_136, __p3_136) __extension__ ({ \
  35464   int16x8_t __ret_136; \
  35465   int16x8_t __s0_136 = __p0_136; \
  35466   int16x8_t __s1_136 = __p1_136; \
  35467   int16x4_t __s2_136 = __p2_136; \
  35468   __ret_136 = vqrdmlahq_s16(__s0_136, __s1_136, splatq_lane_s16(__s2_136, __p3_136)); \
  35469   __ret_136; \
  35470 })
  35471 #else
  35472 #define vqrdmlahq_lane_s16(__p0_137, __p1_137, __p2_137, __p3_137) __extension__ ({ \
  35473   int16x8_t __ret_137; \
  35474   int16x8_t __s0_137 = __p0_137; \
  35475   int16x8_t __s1_137 = __p1_137; \
  35476   int16x4_t __s2_137 = __p2_137; \
  35477   int16x8_t __rev0_137;  __rev0_137 = __builtin_shufflevector(__s0_137, __s0_137, 7, 6, 5, 4, 3, 2, 1, 0); \
  35478   int16x8_t __rev1_137;  __rev1_137 = __builtin_shufflevector(__s1_137, __s1_137, 7, 6, 5, 4, 3, 2, 1, 0); \
  35479   int16x4_t __rev2_137;  __rev2_137 = __builtin_shufflevector(__s2_137, __s2_137, 3, 2, 1, 0); \
  35480   __ret_137 = __noswap_vqrdmlahq_s16(__rev0_137, __rev1_137, __noswap_splatq_lane_s16(__rev2_137, __p3_137)); \
  35481   __ret_137 = __builtin_shufflevector(__ret_137, __ret_137, 7, 6, 5, 4, 3, 2, 1, 0); \
  35482   __ret_137; \
  35483 })
  35484 #endif
  35485 
  35486 #ifdef __LITTLE_ENDIAN__
  35487 #define vqrdmlah_lane_s32(__p0_138, __p1_138, __p2_138, __p3_138) __extension__ ({ \
  35488   int32x2_t __ret_138; \
  35489   int32x2_t __s0_138 = __p0_138; \
  35490   int32x2_t __s1_138 = __p1_138; \
  35491   int32x2_t __s2_138 = __p2_138; \
  35492   __ret_138 = vqrdmlah_s32(__s0_138, __s1_138, splat_lane_s32(__s2_138, __p3_138)); \
  35493   __ret_138; \
  35494 })
  35495 #else
  35496 #define vqrdmlah_lane_s32(__p0_139, __p1_139, __p2_139, __p3_139) __extension__ ({ \
  35497   int32x2_t __ret_139; \
  35498   int32x2_t __s0_139 = __p0_139; \
  35499   int32x2_t __s1_139 = __p1_139; \
  35500   int32x2_t __s2_139 = __p2_139; \
  35501   int32x2_t __rev0_139;  __rev0_139 = __builtin_shufflevector(__s0_139, __s0_139, 1, 0); \
  35502   int32x2_t __rev1_139;  __rev1_139 = __builtin_shufflevector(__s1_139, __s1_139, 1, 0); \
  35503   int32x2_t __rev2_139;  __rev2_139 = __builtin_shufflevector(__s2_139, __s2_139, 1, 0); \
  35504   __ret_139 = __noswap_vqrdmlah_s32(__rev0_139, __rev1_139, __noswap_splat_lane_s32(__rev2_139, __p3_139)); \
  35505   __ret_139 = __builtin_shufflevector(__ret_139, __ret_139, 1, 0); \
  35506   __ret_139; \
  35507 })
  35508 #endif
  35509 
  35510 #ifdef __LITTLE_ENDIAN__
  35511 #define vqrdmlah_lane_s16(__p0_140, __p1_140, __p2_140, __p3_140) __extension__ ({ \
  35512   int16x4_t __ret_140; \
  35513   int16x4_t __s0_140 = __p0_140; \
  35514   int16x4_t __s1_140 = __p1_140; \
  35515   int16x4_t __s2_140 = __p2_140; \
  35516   __ret_140 = vqrdmlah_s16(__s0_140, __s1_140, splat_lane_s16(__s2_140, __p3_140)); \
  35517   __ret_140; \
  35518 })
  35519 #else
  35520 #define vqrdmlah_lane_s16(__p0_141, __p1_141, __p2_141, __p3_141) __extension__ ({ \
  35521   int16x4_t __ret_141; \
  35522   int16x4_t __s0_141 = __p0_141; \
  35523   int16x4_t __s1_141 = __p1_141; \
  35524   int16x4_t __s2_141 = __p2_141; \
  35525   int16x4_t __rev0_141;  __rev0_141 = __builtin_shufflevector(__s0_141, __s0_141, 3, 2, 1, 0); \
  35526   int16x4_t __rev1_141;  __rev1_141 = __builtin_shufflevector(__s1_141, __s1_141, 3, 2, 1, 0); \
  35527   int16x4_t __rev2_141;  __rev2_141 = __builtin_shufflevector(__s2_141, __s2_141, 3, 2, 1, 0); \
  35528   __ret_141 = __noswap_vqrdmlah_s16(__rev0_141, __rev1_141, __noswap_splat_lane_s16(__rev2_141, __p3_141)); \
  35529   __ret_141 = __builtin_shufflevector(__ret_141, __ret_141, 3, 2, 1, 0); \
  35530   __ret_141; \
  35531 })
  35532 #endif
  35533 
  35534 #ifdef __LITTLE_ENDIAN__
  35535 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35536   int32x4_t __ret;
  35537   __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  35538   return __ret;
  35539 }
  35540 #else
  35541 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35542   int32x4_t __ret;
  35543   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35544   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35545   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35546   __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
  35547   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35548   return __ret;
  35549 }
  35550 __ai __attribute__((target("v8.1a,neon"))) int32x4_t __noswap_vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  35551   int32x4_t __ret;
  35552   __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  35553   return __ret;
  35554 }
  35555 #endif
  35556 
  35557 #ifdef __LITTLE_ENDIAN__
  35558 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35559   int16x8_t __ret;
  35560   __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  35561   return __ret;
  35562 }
  35563 #else
  35564 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35565   int16x8_t __ret;
  35566   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35567   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35568   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  35569   __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33);
  35570   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35571   return __ret;
  35572 }
  35573 __ai __attribute__((target("v8.1a,neon"))) int16x8_t __noswap_vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  35574   int16x8_t __ret;
  35575   __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  35576   return __ret;
  35577 }
  35578 #endif
  35579 
  35580 #ifdef __LITTLE_ENDIAN__
  35581 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35582   int32x2_t __ret;
  35583   __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
  35584   return __ret;
  35585 }
  35586 #else
  35587 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35588   int32x2_t __ret;
  35589   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  35590   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  35591   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  35592   __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2);
  35593   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  35594   return __ret;
  35595 }
  35596 __ai __attribute__((target("v8.1a,neon"))) int32x2_t __noswap_vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  35597   int32x2_t __ret;
  35598   __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
  35599   return __ret;
  35600 }
  35601 #endif
  35602 
  35603 #ifdef __LITTLE_ENDIAN__
  35604 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35605   int16x4_t __ret;
  35606   __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1);
  35607   return __ret;
  35608 }
  35609 #else
  35610 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35611   int16x4_t __ret;
  35612   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35613   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35614   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35615   __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1);
  35616   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35617   return __ret;
  35618 }
  35619 __ai __attribute__((target("v8.1a,neon"))) int16x4_t __noswap_vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  35620   int16x4_t __ret;
  35621   __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1);
  35622   return __ret;
  35623 }
  35624 #endif
  35625 
  35626 #ifdef __LITTLE_ENDIAN__
  35627 #define vqrdmlshq_lane_s32(__p0_142, __p1_142, __p2_142, __p3_142) __extension__ ({ \
  35628   int32x4_t __ret_142; \
  35629   int32x4_t __s0_142 = __p0_142; \
  35630   int32x4_t __s1_142 = __p1_142; \
  35631   int32x2_t __s2_142 = __p2_142; \
  35632   __ret_142 = vqrdmlshq_s32(__s0_142, __s1_142, splatq_lane_s32(__s2_142, __p3_142)); \
  35633   __ret_142; \
  35634 })
  35635 #else
  35636 #define vqrdmlshq_lane_s32(__p0_143, __p1_143, __p2_143, __p3_143) __extension__ ({ \
  35637   int32x4_t __ret_143; \
  35638   int32x4_t __s0_143 = __p0_143; \
  35639   int32x4_t __s1_143 = __p1_143; \
  35640   int32x2_t __s2_143 = __p2_143; \
  35641   int32x4_t __rev0_143;  __rev0_143 = __builtin_shufflevector(__s0_143, __s0_143, 3, 2, 1, 0); \
  35642   int32x4_t __rev1_143;  __rev1_143 = __builtin_shufflevector(__s1_143, __s1_143, 3, 2, 1, 0); \
  35643   int32x2_t __rev2_143;  __rev2_143 = __builtin_shufflevector(__s2_143, __s2_143, 1, 0); \
  35644   __ret_143 = __noswap_vqrdmlshq_s32(__rev0_143, __rev1_143, __noswap_splatq_lane_s32(__rev2_143, __p3_143)); \
  35645   __ret_143 = __builtin_shufflevector(__ret_143, __ret_143, 3, 2, 1, 0); \
  35646   __ret_143; \
  35647 })
  35648 #endif
  35649 
  35650 #ifdef __LITTLE_ENDIAN__
  35651 #define vqrdmlshq_lane_s16(__p0_144, __p1_144, __p2_144, __p3_144) __extension__ ({ \
  35652   int16x8_t __ret_144; \
  35653   int16x8_t __s0_144 = __p0_144; \
  35654   int16x8_t __s1_144 = __p1_144; \
  35655   int16x4_t __s2_144 = __p2_144; \
  35656   __ret_144 = vqrdmlshq_s16(__s0_144, __s1_144, splatq_lane_s16(__s2_144, __p3_144)); \
  35657   __ret_144; \
  35658 })
  35659 #else
  35660 #define vqrdmlshq_lane_s16(__p0_145, __p1_145, __p2_145, __p3_145) __extension__ ({ \
  35661   int16x8_t __ret_145; \
  35662   int16x8_t __s0_145 = __p0_145; \
  35663   int16x8_t __s1_145 = __p1_145; \
  35664   int16x4_t __s2_145 = __p2_145; \
  35665   int16x8_t __rev0_145;  __rev0_145 = __builtin_shufflevector(__s0_145, __s0_145, 7, 6, 5, 4, 3, 2, 1, 0); \
  35666   int16x8_t __rev1_145;  __rev1_145 = __builtin_shufflevector(__s1_145, __s1_145, 7, 6, 5, 4, 3, 2, 1, 0); \
  35667   int16x4_t __rev2_145;  __rev2_145 = __builtin_shufflevector(__s2_145, __s2_145, 3, 2, 1, 0); \
  35668   __ret_145 = __noswap_vqrdmlshq_s16(__rev0_145, __rev1_145, __noswap_splatq_lane_s16(__rev2_145, __p3_145)); \
  35669   __ret_145 = __builtin_shufflevector(__ret_145, __ret_145, 7, 6, 5, 4, 3, 2, 1, 0); \
  35670   __ret_145; \
  35671 })
  35672 #endif
  35673 
  35674 #ifdef __LITTLE_ENDIAN__
  35675 #define vqrdmlsh_lane_s32(__p0_146, __p1_146, __p2_146, __p3_146) __extension__ ({ \
  35676   int32x2_t __ret_146; \
  35677   int32x2_t __s0_146 = __p0_146; \
  35678   int32x2_t __s1_146 = __p1_146; \
  35679   int32x2_t __s2_146 = __p2_146; \
  35680   __ret_146 = vqrdmlsh_s32(__s0_146, __s1_146, splat_lane_s32(__s2_146, __p3_146)); \
  35681   __ret_146; \
  35682 })
  35683 #else
  35684 #define vqrdmlsh_lane_s32(__p0_147, __p1_147, __p2_147, __p3_147) __extension__ ({ \
  35685   int32x2_t __ret_147; \
  35686   int32x2_t __s0_147 = __p0_147; \
  35687   int32x2_t __s1_147 = __p1_147; \
  35688   int32x2_t __s2_147 = __p2_147; \
  35689   int32x2_t __rev0_147;  __rev0_147 = __builtin_shufflevector(__s0_147, __s0_147, 1, 0); \
  35690   int32x2_t __rev1_147;  __rev1_147 = __builtin_shufflevector(__s1_147, __s1_147, 1, 0); \
  35691   int32x2_t __rev2_147;  __rev2_147 = __builtin_shufflevector(__s2_147, __s2_147, 1, 0); \
  35692   __ret_147 = __noswap_vqrdmlsh_s32(__rev0_147, __rev1_147, __noswap_splat_lane_s32(__rev2_147, __p3_147)); \
  35693   __ret_147 = __builtin_shufflevector(__ret_147, __ret_147, 1, 0); \
  35694   __ret_147; \
  35695 })
  35696 #endif
  35697 
  /* vqrdmlsh_lane_s16(p0, p1, p2, lane)
   *
   * Broadcasts lane `lane` of the int16x4_t p2 with splat_lane_s16 and hands it
   * to vqrdmlsh_s16 as the third operand, next to p0 and p1.  The big-endian
   * variant reverses the lane order of all three vectors, goes through the
   * __noswap_ helpers, and reverses the result again before yielding it. */
  #ifdef __LITTLE_ENDIAN__
  #define vqrdmlsh_lane_s16(__p0_148, __p1_148, __p2_148, __p3_148) __extension__ ({ \
    int16x4_t __s0_148 = __p0_148; \
    int16x4_t __s1_148 = __p1_148; \
    int16x4_t __s2_148 = __p2_148; \
    /* The last expression is the value of the statement expression. */ \
    vqrdmlsh_s16(__s0_148, __s1_148, splat_lane_s16(__s2_148, __p3_148)); \
  })
  #else
  #define vqrdmlsh_lane_s16(__p0_149, __p1_149, __p2_149, __p3_149) __extension__ ({ \
    int16x4_t __s0_149 = __p0_149; \
    int16x4_t __s1_149 = __p1_149; \
    int16x4_t __s2_149 = __p2_149; \
    int16x4_t __rev0_149 = __builtin_shufflevector(__s0_149, __s0_149, 3, 2, 1, 0); \
    int16x4_t __rev1_149 = __builtin_shufflevector(__s1_149, __s1_149, 3, 2, 1, 0); \
    int16x4_t __rev2_149 = __builtin_shufflevector(__s2_149, __s2_149, 3, 2, 1, 0); \
    int16x4_t __ret_149 = __noswap_vqrdmlsh_s16(__rev0_149, __rev1_149, \
        __noswap_splat_lane_s16(__rev2_149, __p3_149)); \
    /* Undo the lane reversal on the way out. */ \
    __builtin_shufflevector(__ret_149, __ret_149, 3, 2, 1, 0); \
  })
  #endif
  35721 
  35722 #ifdef __LITTLE_ENDIAN__
  35723 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot270_f16(float16x4_t __p0, float16x4_t __p1) {
  35724   float16x4_t __ret;
  35725   __ret = (float16x4_t) __builtin_neon_vcadd_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  35726   return __ret;
  35727 }
  35728 #else
  35729 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot270_f16(float16x4_t __p0, float16x4_t __p1) {
  35730   float16x4_t __ret;
  35731   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35732   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35733   __ret = (float16x4_t) __builtin_neon_vcadd_rot270_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  35734   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35735   return __ret;
  35736 }
  35737 #endif
  35738 
  35739 #ifdef __LITTLE_ENDIAN__
  35740 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot90_f16(float16x4_t __p0, float16x4_t __p1) {
  35741   float16x4_t __ret;
  35742   __ret = (float16x4_t) __builtin_neon_vcadd_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  35743   return __ret;
  35744 }
  35745 #else
  35746 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot90_f16(float16x4_t __p0, float16x4_t __p1) {
  35747   float16x4_t __ret;
  35748   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35749   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35750   __ret = (float16x4_t) __builtin_neon_vcadd_rot90_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  35751   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35752   return __ret;
  35753 }
  35754 #endif
  35755 
  35756 #ifdef __LITTLE_ENDIAN__
  35757 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot270_f16(float16x8_t __p0, float16x8_t __p1) {
  35758   float16x8_t __ret;
  35759   __ret = (float16x8_t) __builtin_neon_vcaddq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  35760   return __ret;
  35761 }
  35762 #else
  35763 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot270_f16(float16x8_t __p0, float16x8_t __p1) {
  35764   float16x8_t __ret;
  35765   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35766   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35767   __ret = (float16x8_t) __builtin_neon_vcaddq_rot270_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  35768   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35769   return __ret;
  35770 }
  35771 #endif
  35772 
  35773 #ifdef __LITTLE_ENDIAN__
  35774 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot90_f16(float16x8_t __p0, float16x8_t __p1) {
  35775   float16x8_t __ret;
  35776   __ret = (float16x8_t) __builtin_neon_vcaddq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  35777   return __ret;
  35778 }
  35779 #else
  35780 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot90_f16(float16x8_t __p0, float16x8_t __p1) {
  35781   float16x8_t __ret;
  35782   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35783   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35784   __ret = (float16x8_t) __builtin_neon_vcaddq_rot90_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  35785   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35786   return __ret;
  35787 }
  35788 #endif
  35789 
  35790 #ifdef __LITTLE_ENDIAN__
  35791 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35792   float16x8_t __ret;
  35793   __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  35794   return __ret;
  35795 }
  35796 #else
  35797 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35798   float16x8_t __ret;
  35799   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35800   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35801   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  35802   __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
  35803   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35804   return __ret;
  35805 }
  35806 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35807   float16x8_t __ret;
  35808   __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  35809   return __ret;
  35810 }
  35811 #endif
  35812 
  35813 #ifdef __LITTLE_ENDIAN__
  35814 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35815   float16x4_t __ret;
  35816   __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  35817   return __ret;
  35818 }
  35819 #else
  35820 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35821   float16x4_t __ret;
  35822   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35823   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35824   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35825   __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
  35826   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35827   return __ret;
  35828 }
  35829 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35830   float16x4_t __ret;
  35831   __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  35832   return __ret;
  35833 }
  35834 #endif
  35835 
  /* vcmla_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes, and passes that vector (viewed as float16x4_t again) to
   * vcmla_f16 as the third operand.  The big-endian variant lane-reverses all
   * inputs, uses the __noswap_ helpers, and lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_lane_f16(__p0_150, __p1_150, __p2_150, __p3_150) __extension__ ({ \
    float16x4_t __s0_150 = __p0_150; \
    float16x4_t __s1_150 = __p1_150; \
    float16x4_t __s2_150 = __p2_150; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_150 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_150), __p3_150); \
    vcmla_f16(__s0_150, __s1_150, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_150, __lane_150})); \
  })
  #else
  #define vcmla_lane_f16(__p0_151, __p1_151, __p2_151, __p3_151) __extension__ ({ \
    float16x4_t __s0_151 = __p0_151; \
    float16x4_t __s1_151 = __p1_151; \
    float16x4_t __s2_151 = __p2_151; \
    float16x4_t __rev0_151 = __builtin_shufflevector(__s0_151, __s0_151, 3, 2, 1, 0); \
    float16x4_t __rev1_151 = __builtin_shufflevector(__s1_151, __s1_151, 3, 2, 1, 0); \
    float16x4_t __rev2_151 = __builtin_shufflevector(__s2_151, __s2_151, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_151 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_151), __p3_151); \
    float16x4_t __ret_151 = __noswap_vcmla_f16(__rev0_151, __rev1_151, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_151, __lane_151})); \
    __builtin_shufflevector(__ret_151, __ret_151, 3, 2, 1, 0); \
  })
  #endif
  35859 
  /* vcmlaq_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into all four
   * 32-bit lanes of a 128-bit vector, and passes that vector (viewed as
   * float16x8_t) to vcmlaq_f16 as the third operand.  The big-endian variant
   * lane-reverses all inputs, uses the __noswap_ helpers, and lane-reverses
   * the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmlaq_lane_f16(__p0_152, __p1_152, __p2_152, __p3_152) __extension__ ({ \
    float16x8_t __s0_152 = __p0_152; \
    float16x8_t __s1_152 = __p1_152; \
    float16x4_t __s2_152 = __p2_152; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_152 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_152), __p3_152); \
    vcmlaq_f16(__s0_152, __s1_152, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_152, __lane_152, __lane_152, __lane_152})); \
  })
  #else
  #define vcmlaq_lane_f16(__p0_153, __p1_153, __p2_153, __p3_153) __extension__ ({ \
    float16x8_t __s0_153 = __p0_153; \
    float16x8_t __s1_153 = __p1_153; \
    float16x4_t __s2_153 = __p2_153; \
    float16x8_t __rev0_153 = __builtin_shufflevector(__s0_153, __s0_153, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev1_153 = __builtin_shufflevector(__s1_153, __s1_153, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x4_t __rev2_153 = __builtin_shufflevector(__s2_153, __s2_153, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_153 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_153), __p3_153); \
    float16x8_t __ret_153 = __noswap_vcmlaq_f16(__rev0_153, __rev1_153, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_153, __lane_153, __lane_153, __lane_153})); \
    __builtin_shufflevector(__ret_153, __ret_153, 7, 6, 5, 4, 3, 2, 1, 0); \
  })
  #endif
  35883 
  /* vcmla_laneq_f16(p0, p1, p2, lane)
   *
   * Views the float16x8_t p2 as four 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes of a 64-bit vector, and passes that vector (viewed as
   * float16x4_t) to vcmla_f16 as the third operand.  The big-endian variant
   * lane-reverses all inputs, uses the __noswap_ helpers, and lane-reverses
   * the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_laneq_f16(__p0_154, __p1_154, __p2_154, __p3_154) __extension__ ({ \
    float16x4_t __s0_154 = __p0_154; \
    float16x4_t __s1_154 = __p1_154; \
    float16x8_t __s2_154 = __p2_154; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_154 = vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_154), __p3_154); \
    vcmla_f16(__s0_154, __s1_154, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_154, __lane_154})); \
  })
  #else
  #define vcmla_laneq_f16(__p0_155, __p1_155, __p2_155, __p3_155) __extension__ ({ \
    float16x4_t __s0_155 = __p0_155; \
    float16x4_t __s1_155 = __p1_155; \
    float16x8_t __s2_155 = __p2_155; \
    float16x4_t __rev0_155 = __builtin_shufflevector(__s0_155, __s0_155, 3, 2, 1, 0); \
    float16x4_t __rev1_155 = __builtin_shufflevector(__s1_155, __s1_155, 3, 2, 1, 0); \
    float16x8_t __rev2_155 = __builtin_shufflevector(__s2_155, __s2_155, 7, 6, 5, 4, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_155 = __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_155), __p3_155); \
    float16x4_t __ret_155 = __noswap_vcmla_f16(__rev0_155, __rev1_155, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_155, __lane_155})); \
    __builtin_shufflevector(__ret_155, __ret_155, 3, 2, 1, 0); \
  })
  #endif
  35907 
  /* vcmlaq_laneq_f16(p0, p1, p2, lane)
   *
   * Views the float16x8_t p2 as four 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into all four
   * 32-bit lanes, and passes that vector (viewed as float16x8_t again) to
   * vcmlaq_f16 as the third operand.  The big-endian variant lane-reverses all
   * inputs, uses the __noswap_ helpers, and lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmlaq_laneq_f16(__p0_156, __p1_156, __p2_156, __p3_156) __extension__ ({ \
    float16x8_t __s0_156 = __p0_156; \
    float16x8_t __s1_156 = __p1_156; \
    float16x8_t __s2_156 = __p2_156; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_156 = vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_156), __p3_156); \
    vcmlaq_f16(__s0_156, __s1_156, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_156, __lane_156, __lane_156, __lane_156})); \
  })
  #else
  #define vcmlaq_laneq_f16(__p0_157, __p1_157, __p2_157, __p3_157) __extension__ ({ \
    float16x8_t __s0_157 = __p0_157; \
    float16x8_t __s1_157 = __p1_157; \
    float16x8_t __s2_157 = __p2_157; \
    float16x8_t __rev0_157 = __builtin_shufflevector(__s0_157, __s0_157, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev1_157 = __builtin_shufflevector(__s1_157, __s1_157, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev2_157 = __builtin_shufflevector(__s2_157, __s2_157, 7, 6, 5, 4, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_157 = __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_157), __p3_157); \
    float16x8_t __ret_157 = __noswap_vcmlaq_f16(__rev0_157, __rev1_157, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_157, __lane_157, __lane_157, __lane_157})); \
    __builtin_shufflevector(__ret_157, __ret_157, 7, 6, 5, 4, 3, 2, 1, 0); \
  })
  #endif
  35931 
  35932 #ifdef __LITTLE_ENDIAN__
  35933 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35934   float16x8_t __ret;
  35935   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  35936   return __ret;
  35937 }
  35938 #else
  35939 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35940   float16x8_t __ret;
  35941   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  35942   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  35943   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  35944   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
  35945   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  35946   return __ret;
  35947 }
  35948 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  35949   float16x8_t __ret;
  35950   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  35951   return __ret;
  35952 }
  35953 #endif
  35954 
  35955 #ifdef __LITTLE_ENDIAN__
  35956 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35957   float16x4_t __ret;
  35958   __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  35959   return __ret;
  35960 }
  35961 #else
  35962 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35963   float16x4_t __ret;
  35964   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  35965   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  35966   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  35967   __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
  35968   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  35969   return __ret;
  35970 }
  35971 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  35972   float16x4_t __ret;
  35973   __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  35974   return __ret;
  35975 }
  35976 #endif
  35977 
  /* vcmla_rot180_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes, and passes that vector (viewed as float16x4_t again) to
   * vcmla_rot180_f16 as the third operand.  The big-endian variant
   * lane-reverses all inputs, uses the __noswap_ helpers, and lane-reverses
   * the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_rot180_lane_f16(__p0_158, __p1_158, __p2_158, __p3_158) __extension__ ({ \
    float16x4_t __s0_158 = __p0_158; \
    float16x4_t __s1_158 = __p1_158; \
    float16x4_t __s2_158 = __p2_158; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_158 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_158), __p3_158); \
    vcmla_rot180_f16(__s0_158, __s1_158, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_158, __lane_158})); \
  })
  #else
  #define vcmla_rot180_lane_f16(__p0_159, __p1_159, __p2_159, __p3_159) __extension__ ({ \
    float16x4_t __s0_159 = __p0_159; \
    float16x4_t __s1_159 = __p1_159; \
    float16x4_t __s2_159 = __p2_159; \
    float16x4_t __rev0_159 = __builtin_shufflevector(__s0_159, __s0_159, 3, 2, 1, 0); \
    float16x4_t __rev1_159 = __builtin_shufflevector(__s1_159, __s1_159, 3, 2, 1, 0); \
    float16x4_t __rev2_159 = __builtin_shufflevector(__s2_159, __s2_159, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_159 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_159), __p3_159); \
    float16x4_t __ret_159 = __noswap_vcmla_rot180_f16(__rev0_159, __rev1_159, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_159, __lane_159})); \
    __builtin_shufflevector(__ret_159, __ret_159, 3, 2, 1, 0); \
  })
  #endif
  36001 
  /* vcmlaq_rot180_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into all four
   * 32-bit lanes of a 128-bit vector, and passes that vector (viewed as
   * float16x8_t) to vcmlaq_rot180_f16 as the third operand.  The big-endian
   * variant lane-reverses all inputs, uses the __noswap_ helpers, and
   * lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmlaq_rot180_lane_f16(__p0_160, __p1_160, __p2_160, __p3_160) __extension__ ({ \
    float16x8_t __s0_160 = __p0_160; \
    float16x8_t __s1_160 = __p1_160; \
    float16x4_t __s2_160 = __p2_160; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_160 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_160), __p3_160); \
    vcmlaq_rot180_f16(__s0_160, __s1_160, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_160, __lane_160, __lane_160, __lane_160})); \
  })
  #else
  #define vcmlaq_rot180_lane_f16(__p0_161, __p1_161, __p2_161, __p3_161) __extension__ ({ \
    float16x8_t __s0_161 = __p0_161; \
    float16x8_t __s1_161 = __p1_161; \
    float16x4_t __s2_161 = __p2_161; \
    float16x8_t __rev0_161 = __builtin_shufflevector(__s0_161, __s0_161, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev1_161 = __builtin_shufflevector(__s1_161, __s1_161, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x4_t __rev2_161 = __builtin_shufflevector(__s2_161, __s2_161, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_161 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_161), __p3_161); \
    float16x8_t __ret_161 = __noswap_vcmlaq_rot180_f16(__rev0_161, __rev1_161, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_161, __lane_161, __lane_161, __lane_161})); \
    __builtin_shufflevector(__ret_161, __ret_161, 7, 6, 5, 4, 3, 2, 1, 0); \
  })
  #endif
  36025 
  /* vcmla_rot180_laneq_f16(p0, p1, p2, lane)
   *
   * Views the float16x8_t p2 as four 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes of a 64-bit vector, and passes that vector (viewed as
   * float16x4_t) to vcmla_rot180_f16 as the third operand.  The big-endian
   * variant lane-reverses all inputs, uses the __noswap_ helpers, and
   * lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_rot180_laneq_f16(__p0_162, __p1_162, __p2_162, __p3_162) __extension__ ({ \
    float16x4_t __s0_162 = __p0_162; \
    float16x4_t __s1_162 = __p1_162; \
    float16x8_t __s2_162 = __p2_162; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_162 = vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_162), __p3_162); \
    vcmla_rot180_f16(__s0_162, __s1_162, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_162, __lane_162})); \
  })
  #else
  #define vcmla_rot180_laneq_f16(__p0_163, __p1_163, __p2_163, __p3_163) __extension__ ({ \
    float16x4_t __s0_163 = __p0_163; \
    float16x4_t __s1_163 = __p1_163; \
    float16x8_t __s2_163 = __p2_163; \
    float16x4_t __rev0_163 = __builtin_shufflevector(__s0_163, __s0_163, 3, 2, 1, 0); \
    float16x4_t __rev1_163 = __builtin_shufflevector(__s1_163, __s1_163, 3, 2, 1, 0); \
    float16x8_t __rev2_163 = __builtin_shufflevector(__s2_163, __s2_163, 7, 6, 5, 4, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_163 = __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_163), __p3_163); \
    float16x4_t __ret_163 = __noswap_vcmla_rot180_f16(__rev0_163, __rev1_163, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_163, __lane_163})); \
    __builtin_shufflevector(__ret_163, __ret_163, 3, 2, 1, 0); \
  })
  #endif
  36049 
  /* vcmlaq_rot180_laneq_f16(p0, p1, p2, lane)
   *
   * Views the float16x8_t p2 as four 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into all four
   * 32-bit lanes, and passes that vector (viewed as float16x8_t again) to
   * vcmlaq_rot180_f16 as the third operand.  The big-endian variant
   * lane-reverses all inputs, uses the __noswap_ helpers, and lane-reverses
   * the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmlaq_rot180_laneq_f16(__p0_164, __p1_164, __p2_164, __p3_164) __extension__ ({ \
    float16x8_t __s0_164 = __p0_164; \
    float16x8_t __s1_164 = __p1_164; \
    float16x8_t __s2_164 = __p2_164; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_164 = vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_164), __p3_164); \
    vcmlaq_rot180_f16(__s0_164, __s1_164, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_164, __lane_164, __lane_164, __lane_164})); \
  })
  #else
  #define vcmlaq_rot180_laneq_f16(__p0_165, __p1_165, __p2_165, __p3_165) __extension__ ({ \
    float16x8_t __s0_165 = __p0_165; \
    float16x8_t __s1_165 = __p1_165; \
    float16x8_t __s2_165 = __p2_165; \
    float16x8_t __rev0_165 = __builtin_shufflevector(__s0_165, __s0_165, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev1_165 = __builtin_shufflevector(__s1_165, __s1_165, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev2_165 = __builtin_shufflevector(__s2_165, __s2_165, 7, 6, 5, 4, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_165 = __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_165), __p3_165); \
    float16x8_t __ret_165 = __noswap_vcmlaq_rot180_f16(__rev0_165, __rev1_165, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_165, __lane_165, __lane_165, __lane_165})); \
    __builtin_shufflevector(__ret_165, __ret_165, 7, 6, 5, 4, 3, 2, 1, 0); \
  })
  #endif
  36073 
  36074 #ifdef __LITTLE_ENDIAN__
  36075 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36076   float16x8_t __ret;
  36077   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  36078   return __ret;
  36079 }
  36080 #else
  36081 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36082   float16x8_t __ret;
  36083   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  36084   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  36085   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  36086   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
  36087   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  36088   return __ret;
  36089 }
  36090 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36091   float16x8_t __ret;
  36092   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  36093   return __ret;
  36094 }
  36095 #endif
  36096 
  36097 #ifdef __LITTLE_ENDIAN__
  36098 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36099   float16x4_t __ret;
  36100   __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  36101   return __ret;
  36102 }
  36103 #else
  36104 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36105   float16x4_t __ret;
  36106   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36107   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36108   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36109   __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
  36110   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36111   return __ret;
  36112 }
  36113 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36114   float16x4_t __ret;
  36115   __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  36116   return __ret;
  36117 }
  36118 #endif
  36119 
  /* vcmla_rot270_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes, and passes that vector (viewed as float16x4_t again) to
   * vcmla_rot270_f16 as the third operand.  The big-endian variant
   * lane-reverses all inputs, uses the __noswap_ helpers, and lane-reverses
   * the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_rot270_lane_f16(__p0_166, __p1_166, __p2_166, __p3_166) __extension__ ({ \
    float16x4_t __s0_166 = __p0_166; \
    float16x4_t __s1_166 = __p1_166; \
    float16x4_t __s2_166 = __p2_166; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_166 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_166), __p3_166); \
    vcmla_rot270_f16(__s0_166, __s1_166, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_166, __lane_166})); \
  })
  #else
  #define vcmla_rot270_lane_f16(__p0_167, __p1_167, __p2_167, __p3_167) __extension__ ({ \
    float16x4_t __s0_167 = __p0_167; \
    float16x4_t __s1_167 = __p1_167; \
    float16x4_t __s2_167 = __p2_167; \
    float16x4_t __rev0_167 = __builtin_shufflevector(__s0_167, __s0_167, 3, 2, 1, 0); \
    float16x4_t __rev1_167 = __builtin_shufflevector(__s1_167, __s1_167, 3, 2, 1, 0); \
    float16x4_t __rev2_167 = __builtin_shufflevector(__s2_167, __s2_167, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_167 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_167), __p3_167); \
    float16x4_t __ret_167 = __noswap_vcmla_rot270_f16(__rev0_167, __rev1_167, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_167, __lane_167})); \
    __builtin_shufflevector(__ret_167, __ret_167, 3, 2, 1, 0); \
  })
  #endif
  36143 
  /* vcmlaq_rot270_lane_f16(p0, p1, p2, lane)
   *
   * Views the float16x4_t p2 as two 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into all four
   * 32-bit lanes of a 128-bit vector, and passes that vector (viewed as
   * float16x8_t) to vcmlaq_rot270_f16 as the third operand.  The big-endian
   * variant lane-reverses all inputs, uses the __noswap_ helpers, and
   * lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmlaq_rot270_lane_f16(__p0_168, __p1_168, __p2_168, __p3_168) __extension__ ({ \
    float16x8_t __s0_168 = __p0_168; \
    float16x8_t __s1_168 = __p1_168; \
    float16x4_t __s2_168 = __p2_168; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_168 = vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_168), __p3_168); \
    vcmlaq_rot270_f16(__s0_168, __s1_168, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_168, __lane_168, __lane_168, __lane_168})); \
  })
  #else
  #define vcmlaq_rot270_lane_f16(__p0_169, __p1_169, __p2_169, __p3_169) __extension__ ({ \
    float16x8_t __s0_169 = __p0_169; \
    float16x8_t __s1_169 = __p1_169; \
    float16x4_t __s2_169 = __p2_169; \
    float16x8_t __rev0_169 = __builtin_shufflevector(__s0_169, __s0_169, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rev1_169 = __builtin_shufflevector(__s1_169, __s1_169, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x4_t __rev2_169 = __builtin_shufflevector(__s2_169, __s2_169, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_169 = __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_169), __p3_169); \
    float16x8_t __ret_169 = __noswap_vcmlaq_rot270_f16(__rev0_169, __rev1_169, \
        __builtin_bit_cast(float16x8_t, (uint32x4_t) {__lane_169, __lane_169, __lane_169, __lane_169})); \
    __builtin_shufflevector(__ret_169, __ret_169, 7, 6, 5, 4, 3, 2, 1, 0); \
  })
  #endif
  36167 
  /* vcmla_rot270_laneq_f16(p0, p1, p2, lane)
   *
   * Views the float16x8_t p2 as four 32-bit lanes (each spanning a pair of
   * adjacent float16 elements), reads lane `lane`, replicates it into both
   * 32-bit lanes of a 64-bit vector, and passes that vector (viewed as
   * float16x4_t) to vcmla_rot270_f16 as the third operand.  The big-endian
   * variant lane-reverses all inputs, uses the __noswap_ helpers, and
   * lane-reverses the result. */
  #ifdef __LITTLE_ENDIAN__
  #define vcmla_rot270_laneq_f16(__p0_170, __p1_170, __p2_170, __p3_170) __extension__ ({ \
    float16x4_t __s0_170 = __p0_170; \
    float16x4_t __s1_170 = __p1_170; \
    float16x8_t __s2_170 = __p2_170; \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_170 = vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_170), __p3_170); \
    vcmla_rot270_f16(__s0_170, __s1_170, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_170, __lane_170})); \
  })
  #else
  #define vcmla_rot270_laneq_f16(__p0_171, __p1_171, __p2_171, __p3_171) __extension__ ({ \
    float16x4_t __s0_171 = __p0_171; \
    float16x4_t __s1_171 = __p1_171; \
    float16x8_t __s2_171 = __p2_171; \
    float16x4_t __rev0_171 = __builtin_shufflevector(__s0_171, __s0_171, 3, 2, 1, 0); \
    float16x4_t __rev1_171 = __builtin_shufflevector(__s1_171, __s1_171, 3, 2, 1, 0); \
    float16x8_t __rev2_171 = __builtin_shufflevector(__s2_171, __s2_171, 7, 6, 5, 4, 3, 2, 1, 0); \
    /* Selected 32-bit lane, read once and then duplicated. */ \
    uint32_t __lane_171 = __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_171), __p3_171); \
    float16x4_t __ret_171 = __noswap_vcmla_rot270_f16(__rev0_171, __rev1_171, \
        __builtin_bit_cast(float16x4_t, (uint32x2_t) {__lane_171, __lane_171})); \
    __builtin_shufflevector(__ret_171, __ret_171, 3, 2, 1, 0); \
  })
  #endif
  36191 
  36192 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot270_laneq_f16(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float16x8_t.  c is viewed as uint32x4_t,
         * 32-bit lane `lane` is read with vgetq_lane_u32 and replicated into all
         * four elements of a uint32x4_t, which is bit-cast to float16x8_t and used
         * as the third operand of vcmlaq_rot270_f16.  The expression evaluates to
         * __ret_172.  The lane argument is pasted textually at each use. */
  36193 #define vcmlaq_rot270_laneq_f16(__p0_172, __p1_172, __p2_172, __p3_172) __extension__ ({ \
  36194   float16x8_t __ret_172; \
  36195   float16x8_t __s0_172 = __p0_172; \
  36196   float16x8_t __s1_172 = __p1_172; \
  36197   float16x8_t __s2_172 = __p2_172; \
  36198   __ret_172 = vcmlaq_rot270_f16(__s0_172, __s1_172, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172)})); \
  36199   __ret_172; \
  36200 })
  36201 #else
        /* Big-endian form: the three inputs are lane-reversed first, the
         * __noswap_ variants of the lane read and of vcmlaq_rot270_f16 are used,
         * and the result is lane-reversed back. */
  36202 #define vcmlaq_rot270_laneq_f16(__p0_173, __p1_173, __p2_173, __p3_173) __extension__ ({ \
  36203   float16x8_t __ret_173; \
  36204   float16x8_t __s0_173 = __p0_173; \
  36205   float16x8_t __s1_173 = __p1_173; \
  36206   float16x8_t __s2_173 = __p2_173; \
  36207   float16x8_t __rev0_173;  __rev0_173 = __builtin_shufflevector(__s0_173, __s0_173, 7, 6, 5, 4, 3, 2, 1, 0); \
  36208   float16x8_t __rev1_173;  __rev1_173 = __builtin_shufflevector(__s1_173, __s1_173, 7, 6, 5, 4, 3, 2, 1, 0); \
  36209   float16x8_t __rev2_173;  __rev2_173 = __builtin_shufflevector(__s2_173, __s2_173, 7, 6, 5, 4, 3, 2, 1, 0); \
  36210   __ret_173 = __noswap_vcmlaq_rot270_f16(__rev0_173, __rev1_173, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173)})); \
  36211   __ret_173 = __builtin_shufflevector(__ret_173, __ret_173, 7, 6, 5, 4, 3, 2, 1, 0); \
  36212   __ret_173; \
  36213 })
  36214 #endif
  36215 
  36216 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot90_f16 -- little-endian form.  Casts the three float16x8_t
         * operands to int8x16_t, calls __builtin_neon_vcmlaq_rot90_f16 with the
         * constant 40 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float16x8_t.
         * Requires the "v8.3a,fullfp16,neon" target features. */
  36217 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36218   float16x8_t __ret;
  36219   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  36220   return __ret;
  36221 }
  36222 #else
        /* Big-endian form: lane-reverses every operand, calls the same builtin,
         * then lane-reverses the result.  __noswap_vcmlaq_rot90_f16 is the same
         * call without any reversal; it is used by the big-endian
         * vcmlaq_rot90_lane_f16 / vcmlaq_rot90_laneq_f16 macros, which reverse
         * their operands themselves. */
  36223 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36224   float16x8_t __ret;
  36225   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  36226   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  36227   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  36228   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40);
  36229   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  36230   return __ret;
  36231 }
  36232 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) {
  36233   float16x8_t __ret;
  36234   __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40);
  36235   return __ret;
  36236 }
  36237 #endif
  36238 
  36239 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot90_f16 -- little-endian form.  Casts the three float16x4_t
         * operands to int8x8_t, calls __builtin_neon_vcmla_rot90_f16 with the
         * constant 8 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float16x4_t.
         * Requires the "v8.3a,fullfp16,neon" target features. */
  36240 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36241   float16x4_t __ret;
  36242   __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  36243   return __ret;
  36244 }
  36245 #else
        /* Big-endian form: lane-reverses every operand, calls the same builtin,
         * then lane-reverses the result.  __noswap_vcmla_rot90_f16 is the same
         * call without any reversal; it is used by the big-endian
         * vcmla_rot90_lane_f16 / vcmla_rot90_laneq_f16 macros, which reverse
         * their operands themselves. */
  36246 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36247   float16x4_t __ret;
  36248   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36249   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36250   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36251   __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8);
  36252   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36253   return __ret;
  36254 }
  36255 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) {
  36256   float16x4_t __ret;
  36257   __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8);
  36258   return __ret;
  36259 }
  36260 #endif
  36261 
  36262 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot90_lane_f16(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float16x4_t.  c is viewed as uint32x2_t,
         * 32-bit lane `lane` is read with vget_lane_u32 (two adjacent f16 values)
         * and placed in both elements of a uint32x2_t, which is bit-cast to
         * float16x4_t and used as the third operand of vcmla_rot90_f16.  The
         * expression evaluates to __ret_174.  The lane argument is pasted textually
         * at each use (presumably it must be a constant). */
  36263 #define vcmla_rot90_lane_f16(__p0_174, __p1_174, __p2_174, __p3_174) __extension__ ({ \
  36264   float16x4_t __ret_174; \
  36265   float16x4_t __s0_174 = __p0_174; \
  36266   float16x4_t __s1_174 = __p1_174; \
  36267   float16x4_t __s2_174 = __p2_174; \
  36268   __ret_174 = vcmla_rot90_f16(__s0_174, __s1_174, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_174), __p3_174), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_174), __p3_174)})); \
  36269   __ret_174; \
  36270 })
  36271 #else
        /* Big-endian form: the three inputs are lane-reversed first, the
         * __noswap_ variants of vget_lane_u32 and vcmla_rot90_f16 are used, and
         * the result is lane-reversed back. */
  36272 #define vcmla_rot90_lane_f16(__p0_175, __p1_175, __p2_175, __p3_175) __extension__ ({ \
  36273   float16x4_t __ret_175; \
  36274   float16x4_t __s0_175 = __p0_175; \
  36275   float16x4_t __s1_175 = __p1_175; \
  36276   float16x4_t __s2_175 = __p2_175; \
  36277   float16x4_t __rev0_175;  __rev0_175 = __builtin_shufflevector(__s0_175, __s0_175, 3, 2, 1, 0); \
  36278   float16x4_t __rev1_175;  __rev1_175 = __builtin_shufflevector(__s1_175, __s1_175, 3, 2, 1, 0); \
  36279   float16x4_t __rev2_175;  __rev2_175 = __builtin_shufflevector(__s2_175, __s2_175, 3, 2, 1, 0); \
  36280   __ret_175 = __noswap_vcmla_rot90_f16(__rev0_175, __rev1_175, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_175), __p3_175), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_175), __p3_175)})); \
  36281   __ret_175 = __builtin_shufflevector(__ret_175, __ret_175, 3, 2, 1, 0); \
  36282   __ret_175; \
  36283 })
  36284 #endif
  36285 
  36286 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot90_lane_f16(a, b, c, lane) -- little-endian form.
         * a and b are float16x8_t, c is float16x4_t.  c is viewed as uint32x2_t,
         * 32-bit lane `lane` is read with vget_lane_u32 and replicated into all
         * four elements of a uint32x4_t, which is bit-cast to float16x8_t and used
         * as the third operand of vcmlaq_rot90_f16.  The expression evaluates to
         * __ret_176.  The lane argument is pasted textually at each use. */
  36287 #define vcmlaq_rot90_lane_f16(__p0_176, __p1_176, __p2_176, __p3_176) __extension__ ({ \
  36288   float16x8_t __ret_176; \
  36289   float16x8_t __s0_176 = __p0_176; \
  36290   float16x8_t __s1_176 = __p1_176; \
  36291   float16x4_t __s2_176 = __p2_176; \
  36292   __ret_176 = vcmlaq_rot90_f16(__s0_176, __s1_176, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176)})); \
  36293   __ret_176; \
  36294 })
  36295 #else
        /* Big-endian form: a and b are reversed over 8 lanes and c over 4 lanes,
         * the __noswap_ variants of vget_lane_u32 and vcmlaq_rot90_f16 are used,
         * and the 8-lane result is reversed back. */
  36296 #define vcmlaq_rot90_lane_f16(__p0_177, __p1_177, __p2_177, __p3_177) __extension__ ({ \
  36297   float16x8_t __ret_177; \
  36298   float16x8_t __s0_177 = __p0_177; \
  36299   float16x8_t __s1_177 = __p1_177; \
  36300   float16x4_t __s2_177 = __p2_177; \
  36301   float16x8_t __rev0_177;  __rev0_177 = __builtin_shufflevector(__s0_177, __s0_177, 7, 6, 5, 4, 3, 2, 1, 0); \
  36302   float16x8_t __rev1_177;  __rev1_177 = __builtin_shufflevector(__s1_177, __s1_177, 7, 6, 5, 4, 3, 2, 1, 0); \
  36303   float16x4_t __rev2_177;  __rev2_177 = __builtin_shufflevector(__s2_177, __s2_177, 3, 2, 1, 0); \
  36304   __ret_177 = __noswap_vcmlaq_rot90_f16(__rev0_177, __rev1_177, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177)})); \
  36305   __ret_177 = __builtin_shufflevector(__ret_177, __ret_177, 7, 6, 5, 4, 3, 2, 1, 0); \
  36306   __ret_177; \
  36307 })
  36308 #endif
  36309 
  36310 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot90_laneq_f16(a, b, c, lane) -- little-endian form.
         * a and b are float16x4_t, c is float16x8_t.  c is viewed as uint32x4_t,
         * 32-bit lane `lane` is read with vgetq_lane_u32 and placed in both
         * elements of a uint32x2_t, which is bit-cast to float16x4_t and used as
         * the third operand of vcmla_rot90_f16.  The expression evaluates to
         * __ret_178.  The lane argument is pasted textually at each use. */
  36311 #define vcmla_rot90_laneq_f16(__p0_178, __p1_178, __p2_178, __p3_178) __extension__ ({ \
  36312   float16x4_t __ret_178; \
  36313   float16x4_t __s0_178 = __p0_178; \
  36314   float16x4_t __s1_178 = __p1_178; \
  36315   float16x8_t __s2_178 = __p2_178; \
  36316   __ret_178 = vcmla_rot90_f16(__s0_178, __s1_178, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_178), __p3_178), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_178), __p3_178)})); \
  36317   __ret_178; \
  36318 })
  36319 #else
        /* Big-endian form: a and b are reversed over 4 lanes and c over 8 lanes,
         * the __noswap_ variants of vgetq_lane_u32 and vcmla_rot90_f16 are used,
         * and the 4-lane result is reversed back. */
  36320 #define vcmla_rot90_laneq_f16(__p0_179, __p1_179, __p2_179, __p3_179) __extension__ ({ \
  36321   float16x4_t __ret_179; \
  36322   float16x4_t __s0_179 = __p0_179; \
  36323   float16x4_t __s1_179 = __p1_179; \
  36324   float16x8_t __s2_179 = __p2_179; \
  36325   float16x4_t __rev0_179;  __rev0_179 = __builtin_shufflevector(__s0_179, __s0_179, 3, 2, 1, 0); \
  36326   float16x4_t __rev1_179;  __rev1_179 = __builtin_shufflevector(__s1_179, __s1_179, 3, 2, 1, 0); \
  36327   float16x8_t __rev2_179;  __rev2_179 = __builtin_shufflevector(__s2_179, __s2_179, 7, 6, 5, 4, 3, 2, 1, 0); \
  36328   __ret_179 = __noswap_vcmla_rot90_f16(__rev0_179, __rev1_179, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_179), __p3_179), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_179), __p3_179)})); \
  36329   __ret_179 = __builtin_shufflevector(__ret_179, __ret_179, 3, 2, 1, 0); \
  36330   __ret_179; \
  36331 })
  36332 #endif
  36333 
  36334 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot90_laneq_f16(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float16x8_t.  c is viewed as uint32x4_t,
         * 32-bit lane `lane` is read with vgetq_lane_u32 and replicated into all
         * four elements of a uint32x4_t, which is bit-cast to float16x8_t and used
         * as the third operand of vcmlaq_rot90_f16.  The expression evaluates to
         * __ret_180.  The lane argument is pasted textually at each use. */
  36335 #define vcmlaq_rot90_laneq_f16(__p0_180, __p1_180, __p2_180, __p3_180) __extension__ ({ \
  36336   float16x8_t __ret_180; \
  36337   float16x8_t __s0_180 = __p0_180; \
  36338   float16x8_t __s1_180 = __p1_180; \
  36339   float16x8_t __s2_180 = __p2_180; \
  36340   __ret_180 = vcmlaq_rot90_f16(__s0_180, __s1_180, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180)})); \
  36341   __ret_180; \
  36342 })
  36343 #else
        /* Big-endian form: the three inputs are lane-reversed first, the
         * __noswap_ variants of vgetq_lane_u32 and vcmlaq_rot90_f16 are used, and
         * the result is lane-reversed back. */
  36344 #define vcmlaq_rot90_laneq_f16(__p0_181, __p1_181, __p2_181, __p3_181) __extension__ ({ \
  36345   float16x8_t __ret_181; \
  36346   float16x8_t __s0_181 = __p0_181; \
  36347   float16x8_t __s1_181 = __p1_181; \
  36348   float16x8_t __s2_181 = __p2_181; \
  36349   float16x8_t __rev0_181;  __rev0_181 = __builtin_shufflevector(__s0_181, __s0_181, 7, 6, 5, 4, 3, 2, 1, 0); \
  36350   float16x8_t __rev1_181;  __rev1_181 = __builtin_shufflevector(__s1_181, __s1_181, 7, 6, 5, 4, 3, 2, 1, 0); \
  36351   float16x8_t __rev2_181;  __rev2_181 = __builtin_shufflevector(__s2_181, __s2_181, 7, 6, 5, 4, 3, 2, 1, 0); \
  36352   __ret_181 = __noswap_vcmlaq_rot90_f16(__rev0_181, __rev1_181, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181)})); \
  36353   __ret_181 = __builtin_shufflevector(__ret_181, __ret_181, 7, 6, 5, 4, 3, 2, 1, 0); \
  36354   __ret_181; \
  36355 })
  36356 #endif
  36357 
  36358 #ifdef __LITTLE_ENDIAN__
        /* vcadd_rot270_f32 -- little-endian form.  Casts both float32x2_t
         * operands to int8x8_t, calls __builtin_neon_vcadd_rot270_f32 with the
         * constant 9 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float32x2_t.
         * Requires the "v8.3a,neon" target features. */
  36359 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot270_f32(float32x2_t __p0, float32x2_t __p1) {
  36360   float32x2_t __ret;
  36361   __ret = (float32x2_t) __builtin_neon_vcadd_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, 9);
  36362   return __ret;
  36363 }
  36364 #else
        /* Big-endian form: swaps the two lanes of each operand, calls the same
         * builtin, then swaps the two lanes of the result. */
  36365 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot270_f32(float32x2_t __p0, float32x2_t __p1) {
  36366   float32x2_t __ret;
  36367   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36368   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36369   __ret = (float32x2_t) __builtin_neon_vcadd_rot270_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  36370   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36371   return __ret;
  36372 }
  36373 #endif
  36374 
  36375 #ifdef __LITTLE_ENDIAN__
        /* vcadd_rot90_f32 -- little-endian form.  Casts both float32x2_t operands
         * to int8x8_t, calls __builtin_neon_vcadd_rot90_f32 with the constant 9 as
         * its last argument (meaning defined by the compiler, not visible in this
         * file), and casts the result back to float32x2_t.
         * Requires the "v8.3a,neon" target features. */
  36376 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot90_f32(float32x2_t __p0, float32x2_t __p1) {
  36377   float32x2_t __ret;
  36378   __ret = (float32x2_t) __builtin_neon_vcadd_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, 9);
  36379   return __ret;
  36380 }
  36381 #else
        /* Big-endian form: swaps the two lanes of each operand, calls the same
         * builtin, then swaps the two lanes of the result. */
  36382 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot90_f32(float32x2_t __p0, float32x2_t __p1) {
  36383   float32x2_t __ret;
  36384   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36385   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36386   __ret = (float32x2_t) __builtin_neon_vcadd_rot90_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  36387   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36388   return __ret;
  36389 }
  36390 #endif
  36391 
  36392 #ifdef __LITTLE_ENDIAN__
        /* vcaddq_rot270_f32 -- little-endian form.  Casts both float32x4_t
         * operands to int8x16_t, calls __builtin_neon_vcaddq_rot270_f32 with the
         * constant 41 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float32x4_t.
         * Requires the "v8.3a,neon" target features. */
  36393 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot270_f32(float32x4_t __p0, float32x4_t __p1) {
  36394   float32x4_t __ret;
  36395   __ret = (float32x4_t) __builtin_neon_vcaddq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, 41);
  36396   return __ret;
  36397 }
  36398 #else
        /* Big-endian form: reverses the four lanes of each operand, calls the
         * same builtin, then reverses the four lanes of the result. */
  36399 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot270_f32(float32x4_t __p0, float32x4_t __p1) {
  36400   float32x4_t __ret;
  36401   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36402   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36403   __ret = (float32x4_t) __builtin_neon_vcaddq_rot270_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  36404   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36405   return __ret;
  36406 }
  36407 #endif
  36408 
  36409 #ifdef __LITTLE_ENDIAN__
        /* vcaddq_rot90_f32 -- little-endian form.  Casts both float32x4_t
         * operands to int8x16_t, calls __builtin_neon_vcaddq_rot90_f32 with the
         * constant 41 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float32x4_t.
         * Requires the "v8.3a,neon" target features. */
  36410 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot90_f32(float32x4_t __p0, float32x4_t __p1) {
  36411   float32x4_t __ret;
  36412   __ret = (float32x4_t) __builtin_neon_vcaddq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, 41);
  36413   return __ret;
  36414 }
  36415 #else
        /* Big-endian form: reverses the four lanes of each operand, calls the
         * same builtin, then reverses the four lanes of the result. */
  36416 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot90_f32(float32x4_t __p0, float32x4_t __p1) {
  36417   float32x4_t __ret;
  36418   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36419   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36420   __ret = (float32x4_t) __builtin_neon_vcaddq_rot90_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  36421   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36422   return __ret;
  36423 }
  36424 #endif
  36425 
  36426 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_f32 -- little-endian form.  Casts the three float32x4_t operands
         * to int8x16_t, calls __builtin_neon_vcmlaq_f32 with the constant 41 as its
         * last argument (meaning defined by the compiler, not visible in this
         * file), and casts the result back to float32x4_t.
         * Requires the "v8.3a,neon" target features. */
  36427 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36428   float32x4_t __ret;
  36429   __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36430   return __ret;
  36431 }
  36432 #else
        /* Big-endian form: lane-reverses every operand, calls the same builtin,
         * then lane-reverses the result.  __noswap_vcmlaq_f32 is the same call
         * without any reversal; it is used by the big-endian vcmlaq_lane_f32 /
         * vcmlaq_laneq_f32 macros, which reverse their operands themselves. */
  36433 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36434   float32x4_t __ret;
  36435   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36436   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36437   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36438   __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  36439   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36440   return __ret;
  36441 }
  36442 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36443   float32x4_t __ret;
  36444   __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36445   return __ret;
  36446 }
  36447 #endif
  36448 
  36449 #ifdef __LITTLE_ENDIAN__
        /* vcmla_f32 -- little-endian form.  Casts the three float32x2_t operands
         * to int8x8_t, calls __builtin_neon_vcmla_f32 with the constant 9 as its
         * last argument (meaning defined by the compiler, not visible in this
         * file), and casts the result back to float32x2_t.
         * Requires the "v8.3a,neon" target features. */
  36450 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36451   float32x2_t __ret;
  36452   __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36453   return __ret;
  36454 }
  36455 #else
        /* Big-endian form: swaps the two lanes of every operand, calls the same
         * builtin, then swaps the two lanes of the result.  __noswap_vcmla_f32 is
         * the same call without any reversal; it is used by the big-endian
         * vcmla_lane_f32 / vcmla_laneq_f32 macros, which reverse their operands
         * themselves. */
  36456 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36457   float32x2_t __ret;
  36458   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36459   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36460   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  36461   __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  36462   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36463   return __ret;
  36464 }
  36465 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36466   float32x2_t __ret;
  36467   __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36468   return __ret;
  36469 }
  36470 #endif
  36471 
  36472 #ifdef __LITTLE_ENDIAN__
        /* vcmla_lane_f32(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float32x2_t.  c is viewed as uint64x1_t,
         * 64-bit lane `lane` is read with vget_lane_u64 (two adjacent f32 values)
         * and wrapped in a one-element uint64x1_t, which is bit-cast to
         * float32x2_t and used as the third operand of vcmla_f32.  The expression
         * evaluates to __ret_182. */
  36473 #define vcmla_lane_f32(__p0_182, __p1_182, __p2_182, __p3_182) __extension__ ({ \
  36474   float32x2_t __ret_182; \
  36475   float32x2_t __s0_182 = __p0_182; \
  36476   float32x2_t __s1_182 = __p1_182; \
  36477   float32x2_t __s2_182 = __p2_182; \
  36478   __ret_182 = vcmla_f32(__s0_182, __s1_182, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_182), __p3_182)})); \
  36479   __ret_182; \
  36480 })
  36481 #else
        /* Big-endian form: the three inputs have their two lanes swapped, the
         * operation goes through __noswap_vcmla_f32, and the result is swapped
         * back.  The lane read here uses plain vget_lane_u64 (no __noswap_
         * variant is referenced for the one-element uint64x1_t view). */
  36482 #define vcmla_lane_f32(__p0_183, __p1_183, __p2_183, __p3_183) __extension__ ({ \
  36483   float32x2_t __ret_183; \
  36484   float32x2_t __s0_183 = __p0_183; \
  36485   float32x2_t __s1_183 = __p1_183; \
  36486   float32x2_t __s2_183 = __p2_183; \
  36487   float32x2_t __rev0_183;  __rev0_183 = __builtin_shufflevector(__s0_183, __s0_183, 1, 0); \
  36488   float32x2_t __rev1_183;  __rev1_183 = __builtin_shufflevector(__s1_183, __s1_183, 1, 0); \
  36489   float32x2_t __rev2_183;  __rev2_183 = __builtin_shufflevector(__s2_183, __s2_183, 1, 0); \
  36490   __ret_183 = __noswap_vcmla_f32(__rev0_183, __rev1_183, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_183), __p3_183)})); \
  36491   __ret_183 = __builtin_shufflevector(__ret_183, __ret_183, 1, 0); \
  36492   __ret_183; \
  36493 })
  36494 #endif
  36495 
  36496 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_lane_f32(a, b, c, lane) -- little-endian form.
         * a and b are float32x4_t, c is float32x2_t.  c is viewed as uint64x1_t,
         * 64-bit lane `lane` is read with vget_lane_u64 and placed in both
         * elements of a uint64x2_t, which is bit-cast to float32x4_t and used as
         * the third operand of vcmlaq_f32.  The expression evaluates to __ret_184.
         * The lane argument is pasted textually at each use. */
  36497 #define vcmlaq_lane_f32(__p0_184, __p1_184, __p2_184, __p3_184) __extension__ ({ \
  36498   float32x4_t __ret_184; \
  36499   float32x4_t __s0_184 = __p0_184; \
  36500   float32x4_t __s1_184 = __p1_184; \
  36501   float32x2_t __s2_184 = __p2_184; \
  36502   __ret_184 = vcmlaq_f32(__s0_184, __s1_184, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_184), __p3_184), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_184), __p3_184)})); \
  36503   __ret_184; \
  36504 })
  36505 #else
        /* Big-endian form: a and b are reversed over 4 lanes and c over 2 lanes,
         * the operation goes through __noswap_vcmlaq_f32, and the 4-lane result is
         * reversed back.  The lane read uses plain vget_lane_u64 on the
         * one-element uint64x1_t view. */
  36506 #define vcmlaq_lane_f32(__p0_185, __p1_185, __p2_185, __p3_185) __extension__ ({ \
  36507   float32x4_t __ret_185; \
  36508   float32x4_t __s0_185 = __p0_185; \
  36509   float32x4_t __s1_185 = __p1_185; \
  36510   float32x2_t __s2_185 = __p2_185; \
  36511   float32x4_t __rev0_185;  __rev0_185 = __builtin_shufflevector(__s0_185, __s0_185, 3, 2, 1, 0); \
  36512   float32x4_t __rev1_185;  __rev1_185 = __builtin_shufflevector(__s1_185, __s1_185, 3, 2, 1, 0); \
  36513   float32x2_t __rev2_185;  __rev2_185 = __builtin_shufflevector(__s2_185, __s2_185, 1, 0); \
  36514   __ret_185 = __noswap_vcmlaq_f32(__rev0_185, __rev1_185, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_185), __p3_185), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_185), __p3_185)})); \
  36515   __ret_185 = __builtin_shufflevector(__ret_185, __ret_185, 3, 2, 1, 0); \
  36516   __ret_185; \
  36517 })
  36518 #endif
  36519 
  36520 #ifdef __LITTLE_ENDIAN__
        /* vcmla_laneq_f32(a, b, c, lane) -- little-endian form.
         * a and b are float32x2_t, c is float32x4_t.  c is viewed as uint64x2_t,
         * 64-bit lane `lane` is read with vgetq_lane_u64 (two adjacent f32 values)
         * and wrapped in a one-element uint64x1_t, which is bit-cast to
         * float32x2_t and used as the third operand of vcmla_f32.  The expression
         * evaluates to __ret_186. */
  36521 #define vcmla_laneq_f32(__p0_186, __p1_186, __p2_186, __p3_186) __extension__ ({ \
  36522   float32x2_t __ret_186; \
  36523   float32x2_t __s0_186 = __p0_186; \
  36524   float32x2_t __s1_186 = __p1_186; \
  36525   float32x4_t __s2_186 = __p2_186; \
  36526   __ret_186 = vcmla_f32(__s0_186, __s1_186, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_186), __p3_186)})); \
  36527   __ret_186; \
  36528 })
  36529 #else
        /* Big-endian form: a and b are reversed over 2 lanes and c over 4 lanes,
         * the __noswap_ variants of vgetq_lane_u64 and vcmla_f32 are used, and the
         * 2-lane result is reversed back. */
  36530 #define vcmla_laneq_f32(__p0_187, __p1_187, __p2_187, __p3_187) __extension__ ({ \
  36531   float32x2_t __ret_187; \
  36532   float32x2_t __s0_187 = __p0_187; \
  36533   float32x2_t __s1_187 = __p1_187; \
  36534   float32x4_t __s2_187 = __p2_187; \
  36535   float32x2_t __rev0_187;  __rev0_187 = __builtin_shufflevector(__s0_187, __s0_187, 1, 0); \
  36536   float32x2_t __rev1_187;  __rev1_187 = __builtin_shufflevector(__s1_187, __s1_187, 1, 0); \
  36537   float32x4_t __rev2_187;  __rev2_187 = __builtin_shufflevector(__s2_187, __s2_187, 3, 2, 1, 0); \
  36538   __ret_187 = __noswap_vcmla_f32(__rev0_187, __rev1_187, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_187), __p3_187)})); \
  36539   __ret_187 = __builtin_shufflevector(__ret_187, __ret_187, 1, 0); \
  36540   __ret_187; \
  36541 })
  36542 #endif
  36543 
  36544 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_laneq_f32(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float32x4_t.  c is viewed as uint64x2_t,
         * 64-bit lane `lane` is read with vgetq_lane_u64 and placed in both
         * elements of a uint64x2_t, which is bit-cast to float32x4_t and used as
         * the third operand of vcmlaq_f32.  The expression evaluates to __ret_188.
         * The lane argument is pasted textually at each use. */
  36545 #define vcmlaq_laneq_f32(__p0_188, __p1_188, __p2_188, __p3_188) __extension__ ({ \
  36546   float32x4_t __ret_188; \
  36547   float32x4_t __s0_188 = __p0_188; \
  36548   float32x4_t __s1_188 = __p1_188; \
  36549   float32x4_t __s2_188 = __p2_188; \
  36550   __ret_188 = vcmlaq_f32(__s0_188, __s1_188, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_188), __p3_188), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_188), __p3_188)})); \
  36551   __ret_188; \
  36552 })
  36553 #else
        /* Big-endian form: the three inputs are lane-reversed first, the
         * __noswap_ variants of vgetq_lane_u64 and vcmlaq_f32 are used, and the
         * result is lane-reversed back. */
  36554 #define vcmlaq_laneq_f32(__p0_189, __p1_189, __p2_189, __p3_189) __extension__ ({ \
  36555   float32x4_t __ret_189; \
  36556   float32x4_t __s0_189 = __p0_189; \
  36557   float32x4_t __s1_189 = __p1_189; \
  36558   float32x4_t __s2_189 = __p2_189; \
  36559   float32x4_t __rev0_189;  __rev0_189 = __builtin_shufflevector(__s0_189, __s0_189, 3, 2, 1, 0); \
  36560   float32x4_t __rev1_189;  __rev1_189 = __builtin_shufflevector(__s1_189, __s1_189, 3, 2, 1, 0); \
  36561   float32x4_t __rev2_189;  __rev2_189 = __builtin_shufflevector(__s2_189, __s2_189, 3, 2, 1, 0); \
  36562   __ret_189 = __noswap_vcmlaq_f32(__rev0_189, __rev1_189, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_189), __p3_189), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_189), __p3_189)})); \
  36563   __ret_189 = __builtin_shufflevector(__ret_189, __ret_189, 3, 2, 1, 0); \
  36564   __ret_189; \
  36565 })
  36566 #endif
  36567 
  36568 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot180_f32 -- little-endian form.  Casts the three float32x4_t
         * operands to int8x16_t, calls __builtin_neon_vcmlaq_rot180_f32 with the
         * constant 41 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float32x4_t.
         * Requires the "v8.3a,neon" target features. */
  36569 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36570   float32x4_t __ret;
  36571   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36572   return __ret;
  36573 }
  36574 #else
        /* Big-endian form: lane-reverses every operand, calls the same builtin,
         * then lane-reverses the result.  __noswap_vcmlaq_rot180_f32 is the same
         * call without any reversal; it is used by the big-endian
         * vcmlaq_rot180_lane_f32 / vcmlaq_rot180_laneq_f32 macros, which reverse
         * their operands themselves. */
  36575 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36576   float32x4_t __ret;
  36577   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36578   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36579   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36580   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  36581   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36582   return __ret;
  36583 }
  36584 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36585   float32x4_t __ret;
  36586   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36587   return __ret;
  36588 }
  36589 #endif
  36590 
  36591 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot180_f32 -- little-endian form.  Casts the three float32x2_t
         * operands to int8x8_t, calls __builtin_neon_vcmla_rot180_f32 with the
         * constant 9 as its last argument (meaning defined by the compiler, not
         * visible in this file), and casts the result back to float32x2_t.
         * Requires the "v8.3a,neon" target features. */
  36592 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36593   float32x2_t __ret;
  36594   __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36595   return __ret;
  36596 }
  36597 #else
        /* Big-endian form: swaps the two lanes of every operand, calls the same
         * builtin, then swaps the two lanes of the result.
         * __noswap_vcmla_rot180_f32 is the same call without any reversal; it is
         * used by the big-endian vcmla_rot180_lane_f32 / vcmla_rot180_laneq_f32
         * macros, which reverse their operands themselves. */
  36598 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36599   float32x2_t __ret;
  36600   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36601   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36602   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  36603   __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  36604   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36605   return __ret;
  36606 }
  36607 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36608   float32x2_t __ret;
  36609   __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36610   return __ret;
  36611 }
  36612 #endif
  36613 
  36614 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot180_lane_f32(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float32x2_t.  c is viewed as uint64x1_t,
         * 64-bit lane `lane` is read with vget_lane_u64 (two adjacent f32 values)
         * and wrapped in a one-element uint64x1_t, which is bit-cast to
         * float32x2_t and used as the third operand of vcmla_rot180_f32.  The
         * expression evaluates to __ret_190. */
  36615 #define vcmla_rot180_lane_f32(__p0_190, __p1_190, __p2_190, __p3_190) __extension__ ({ \
  36616   float32x2_t __ret_190; \
  36617   float32x2_t __s0_190 = __p0_190; \
  36618   float32x2_t __s1_190 = __p1_190; \
  36619   float32x2_t __s2_190 = __p2_190; \
  36620   __ret_190 = vcmla_rot180_f32(__s0_190, __s1_190, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_190), __p3_190)})); \
  36621   __ret_190; \
  36622 })
  36623 #else
        /* Big-endian form: the three inputs have their two lanes swapped, the
         * operation goes through __noswap_vcmla_rot180_f32, and the result is
         * swapped back.  The lane read uses plain vget_lane_u64 on the
         * one-element uint64x1_t view. */
  36624 #define vcmla_rot180_lane_f32(__p0_191, __p1_191, __p2_191, __p3_191) __extension__ ({ \
  36625   float32x2_t __ret_191; \
  36626   float32x2_t __s0_191 = __p0_191; \
  36627   float32x2_t __s1_191 = __p1_191; \
  36628   float32x2_t __s2_191 = __p2_191; \
  36629   float32x2_t __rev0_191;  __rev0_191 = __builtin_shufflevector(__s0_191, __s0_191, 1, 0); \
  36630   float32x2_t __rev1_191;  __rev1_191 = __builtin_shufflevector(__s1_191, __s1_191, 1, 0); \
  36631   float32x2_t __rev2_191;  __rev2_191 = __builtin_shufflevector(__s2_191, __s2_191, 1, 0); \
  36632   __ret_191 = __noswap_vcmla_rot180_f32(__rev0_191, __rev1_191, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_191), __p3_191)})); \
  36633   __ret_191 = __builtin_shufflevector(__ret_191, __ret_191, 1, 0); \
  36634   __ret_191; \
  36635 })
  36636 #endif
  36637 
  36638 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot180_lane_f32(a, b, c, lane) -- little-endian form.
         * a and b are float32x4_t, c is float32x2_t.  c is viewed as uint64x1_t,
         * 64-bit lane `lane` is read with vget_lane_u64 and placed in both
         * elements of a uint64x2_t, which is bit-cast to float32x4_t and used as
         * the third operand of vcmlaq_rot180_f32.  The expression evaluates to
         * __ret_192.  The lane argument is pasted textually at each use. */
  36639 #define vcmlaq_rot180_lane_f32(__p0_192, __p1_192, __p2_192, __p3_192) __extension__ ({ \
  36640   float32x4_t __ret_192; \
  36641   float32x4_t __s0_192 = __p0_192; \
  36642   float32x4_t __s1_192 = __p1_192; \
  36643   float32x2_t __s2_192 = __p2_192; \
  36644   __ret_192 = vcmlaq_rot180_f32(__s0_192, __s1_192, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_192), __p3_192), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_192), __p3_192)})); \
  36645   __ret_192; \
  36646 })
  36647 #else
        /* Big-endian form: a and b are reversed over 4 lanes and c over 2 lanes,
         * the operation goes through __noswap_vcmlaq_rot180_f32, and the 4-lane
         * result is reversed back.  The lane read uses plain vget_lane_u64 on the
         * one-element uint64x1_t view. */
  36648 #define vcmlaq_rot180_lane_f32(__p0_193, __p1_193, __p2_193, __p3_193) __extension__ ({ \
  36649   float32x4_t __ret_193; \
  36650   float32x4_t __s0_193 = __p0_193; \
  36651   float32x4_t __s1_193 = __p1_193; \
  36652   float32x2_t __s2_193 = __p2_193; \
  36653   float32x4_t __rev0_193;  __rev0_193 = __builtin_shufflevector(__s0_193, __s0_193, 3, 2, 1, 0); \
  36654   float32x4_t __rev1_193;  __rev1_193 = __builtin_shufflevector(__s1_193, __s1_193, 3, 2, 1, 0); \
  36655   float32x2_t __rev2_193;  __rev2_193 = __builtin_shufflevector(__s2_193, __s2_193, 1, 0); \
  36656   __ret_193 = __noswap_vcmlaq_rot180_f32(__rev0_193, __rev1_193, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_193), __p3_193), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_193), __p3_193)})); \
  36657   __ret_193 = __builtin_shufflevector(__ret_193, __ret_193, 3, 2, 1, 0); \
  36658   __ret_193; \
  36659 })
  36660 #endif
  36661 
  36662 #ifdef __LITTLE_ENDIAN__
        /* vcmla_rot180_laneq_f32(a, b, c, lane) -- little-endian form.
         * a and b are float32x2_t, c is float32x4_t.  c is viewed as uint64x2_t,
         * 64-bit lane `lane` is read with vgetq_lane_u64 (two adjacent f32 values)
         * and wrapped in a one-element uint64x1_t, which is bit-cast to
         * float32x2_t and used as the third operand of vcmla_rot180_f32.  The
         * expression evaluates to __ret_194. */
  36663 #define vcmla_rot180_laneq_f32(__p0_194, __p1_194, __p2_194, __p3_194) __extension__ ({ \
  36664   float32x2_t __ret_194; \
  36665   float32x2_t __s0_194 = __p0_194; \
  36666   float32x2_t __s1_194 = __p1_194; \
  36667   float32x4_t __s2_194 = __p2_194; \
  36668   __ret_194 = vcmla_rot180_f32(__s0_194, __s1_194, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_194), __p3_194)})); \
  36669   __ret_194; \
  36670 })
  36671 #else
        /* Big-endian form: a and b are reversed over 2 lanes and c over 4 lanes,
         * the __noswap_ variants of vgetq_lane_u64 and vcmla_rot180_f32 are used,
         * and the 2-lane result is reversed back. */
  36672 #define vcmla_rot180_laneq_f32(__p0_195, __p1_195, __p2_195, __p3_195) __extension__ ({ \
  36673   float32x2_t __ret_195; \
  36674   float32x2_t __s0_195 = __p0_195; \
  36675   float32x2_t __s1_195 = __p1_195; \
  36676   float32x4_t __s2_195 = __p2_195; \
  36677   float32x2_t __rev0_195;  __rev0_195 = __builtin_shufflevector(__s0_195, __s0_195, 1, 0); \
  36678   float32x2_t __rev1_195;  __rev1_195 = __builtin_shufflevector(__s1_195, __s1_195, 1, 0); \
  36679   float32x4_t __rev2_195;  __rev2_195 = __builtin_shufflevector(__s2_195, __s2_195, 3, 2, 1, 0); \
  36680   __ret_195 = __noswap_vcmla_rot180_f32(__rev0_195, __rev1_195, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_195), __p3_195)})); \
  36681   __ret_195 = __builtin_shufflevector(__ret_195, __ret_195, 1, 0); \
  36682   __ret_195; \
  36683 })
  36684 #endif
  36685 
  36686 #ifdef __LITTLE_ENDIAN__
        /* vcmlaq_rot180_laneq_f32(a, b, c, lane) -- little-endian form.
         * All three vector arguments are float32x4_t.  c is viewed as uint64x2_t,
         * 64-bit lane `lane` is read with vgetq_lane_u64 and placed in both
         * elements of a uint64x2_t, which is bit-cast to float32x4_t and used as
         * the third operand of vcmlaq_rot180_f32.  The expression evaluates to
         * __ret_196.  The lane argument is pasted textually at each use. */
  36687 #define vcmlaq_rot180_laneq_f32(__p0_196, __p1_196, __p2_196, __p3_196) __extension__ ({ \
  36688   float32x4_t __ret_196; \
  36689   float32x4_t __s0_196 = __p0_196; \
  36690   float32x4_t __s1_196 = __p1_196; \
  36691   float32x4_t __s2_196 = __p2_196; \
  36692   __ret_196 = vcmlaq_rot180_f32(__s0_196, __s1_196, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_196), __p3_196), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_196), __p3_196)})); \
  36693   __ret_196; \
  36694 })
  36695 #else
        /* Big-endian form: the three inputs are lane-reversed first, the
         * __noswap_ variants of vgetq_lane_u64 and vcmlaq_rot180_f32 are used, and
         * the result is lane-reversed back. */
  36696 #define vcmlaq_rot180_laneq_f32(__p0_197, __p1_197, __p2_197, __p3_197) __extension__ ({ \
  36697   float32x4_t __ret_197; \
  36698   float32x4_t __s0_197 = __p0_197; \
  36699   float32x4_t __s1_197 = __p1_197; \
  36700   float32x4_t __s2_197 = __p2_197; \
  36701   float32x4_t __rev0_197;  __rev0_197 = __builtin_shufflevector(__s0_197, __s0_197, 3, 2, 1, 0); \
  36702   float32x4_t __rev1_197;  __rev1_197 = __builtin_shufflevector(__s1_197, __s1_197, 3, 2, 1, 0); \
  36703   float32x4_t __rev2_197;  __rev2_197 = __builtin_shufflevector(__s2_197, __s2_197, 3, 2, 1, 0); \
  36704   __ret_197 = __noswap_vcmlaq_rot180_f32(__rev0_197, __rev1_197, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_197), __p3_197), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_197), __p3_197)})); \
  36705   __ret_197 = __builtin_shufflevector(__ret_197, __ret_197, 3, 2, 1, 0); \
  36706   __ret_197; \
  36707 })
  36708 #endif
  36709 
  36710 #ifdef __LITTLE_ENDIAN__
  36711 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36712   float32x4_t __ret;
  36713   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36714   return __ret;
  36715 }
  36716 #else
  36717 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36718   float32x4_t __ret;
  36719   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36720   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36721   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36722   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  36723   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36724   return __ret;
  36725 }
  36726 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36727   float32x4_t __ret;
  36728   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36729   return __ret;
  36730 }
  36731 #endif
  36732 
  36733 #ifdef __LITTLE_ENDIAN__
  36734 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36735   float32x2_t __ret;
  36736   __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36737   return __ret;
  36738 }
  36739 #else
  36740 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36741   float32x2_t __ret;
  36742   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36743   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36744   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  36745   __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  36746   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36747   return __ret;
  36748 }
  36749 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36750   float32x2_t __ret;
  36751   __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36752   return __ret;
  36753 }
  36754 #endif
  36755 
  36756 #ifdef __LITTLE_ENDIAN__
  36757 #define vcmla_rot270_lane_f32(__p0_198, __p1_198, __p2_198, __p3_198) __extension__ ({ \
  36758   float32x2_t __ret_198; \
  36759   float32x2_t __s0_198 = __p0_198; \
  36760   float32x2_t __s1_198 = __p1_198; \
  36761   float32x2_t __s2_198 = __p2_198; \
  36762   __ret_198 = vcmla_rot270_f32(__s0_198, __s1_198, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_198), __p3_198)})); \
  36763   __ret_198; \
  36764 })
  36765 #else
  36766 #define vcmla_rot270_lane_f32(__p0_199, __p1_199, __p2_199, __p3_199) __extension__ ({ \
  36767   float32x2_t __ret_199; \
  36768   float32x2_t __s0_199 = __p0_199; \
  36769   float32x2_t __s1_199 = __p1_199; \
  36770   float32x2_t __s2_199 = __p2_199; \
  36771   float32x2_t __rev0_199;  __rev0_199 = __builtin_shufflevector(__s0_199, __s0_199, 1, 0); \
  36772   float32x2_t __rev1_199;  __rev1_199 = __builtin_shufflevector(__s1_199, __s1_199, 1, 0); \
  36773   float32x2_t __rev2_199;  __rev2_199 = __builtin_shufflevector(__s2_199, __s2_199, 1, 0); \
  36774   __ret_199 = __noswap_vcmla_rot270_f32(__rev0_199, __rev1_199, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_199), __p3_199)})); \
  36775   __ret_199 = __builtin_shufflevector(__ret_199, __ret_199, 1, 0); \
  36776   __ret_199; \
  36777 })
  36778 #endif
  36779 
  36780 #ifdef __LITTLE_ENDIAN__
  36781 #define vcmlaq_rot270_lane_f32(__p0_200, __p1_200, __p2_200, __p3_200) __extension__ ({ \
  36782   float32x4_t __ret_200; \
  36783   float32x4_t __s0_200 = __p0_200; \
  36784   float32x4_t __s1_200 = __p1_200; \
  36785   float32x2_t __s2_200 = __p2_200; \
  36786   __ret_200 = vcmlaq_rot270_f32(__s0_200, __s1_200, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_200), __p3_200), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_200), __p3_200)})); \
  36787   __ret_200; \
  36788 })
  36789 #else
  36790 #define vcmlaq_rot270_lane_f32(__p0_201, __p1_201, __p2_201, __p3_201) __extension__ ({ \
  36791   float32x4_t __ret_201; \
  36792   float32x4_t __s0_201 = __p0_201; \
  36793   float32x4_t __s1_201 = __p1_201; \
  36794   float32x2_t __s2_201 = __p2_201; \
  36795   float32x4_t __rev0_201;  __rev0_201 = __builtin_shufflevector(__s0_201, __s0_201, 3, 2, 1, 0); \
  36796   float32x4_t __rev1_201;  __rev1_201 = __builtin_shufflevector(__s1_201, __s1_201, 3, 2, 1, 0); \
  36797   float32x2_t __rev2_201;  __rev2_201 = __builtin_shufflevector(__s2_201, __s2_201, 1, 0); \
  36798   __ret_201 = __noswap_vcmlaq_rot270_f32(__rev0_201, __rev1_201, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_201), __p3_201), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_201), __p3_201)})); \
  36799   __ret_201 = __builtin_shufflevector(__ret_201, __ret_201, 3, 2, 1, 0); \
  36800   __ret_201; \
  36801 })
  36802 #endif
  36803 
  36804 #ifdef __LITTLE_ENDIAN__
  36805 #define vcmla_rot270_laneq_f32(__p0_202, __p1_202, __p2_202, __p3_202) __extension__ ({ \
  36806   float32x2_t __ret_202; \
  36807   float32x2_t __s0_202 = __p0_202; \
  36808   float32x2_t __s1_202 = __p1_202; \
  36809   float32x4_t __s2_202 = __p2_202; \
  36810   __ret_202 = vcmla_rot270_f32(__s0_202, __s1_202, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_202), __p3_202)})); \
  36811   __ret_202; \
  36812 })
  36813 #else
  36814 #define vcmla_rot270_laneq_f32(__p0_203, __p1_203, __p2_203, __p3_203) __extension__ ({ \
  36815   float32x2_t __ret_203; \
  36816   float32x2_t __s0_203 = __p0_203; \
  36817   float32x2_t __s1_203 = __p1_203; \
  36818   float32x4_t __s2_203 = __p2_203; \
  36819   float32x2_t __rev0_203;  __rev0_203 = __builtin_shufflevector(__s0_203, __s0_203, 1, 0); \
  36820   float32x2_t __rev1_203;  __rev1_203 = __builtin_shufflevector(__s1_203, __s1_203, 1, 0); \
  36821   float32x4_t __rev2_203;  __rev2_203 = __builtin_shufflevector(__s2_203, __s2_203, 3, 2, 1, 0); \
  36822   __ret_203 = __noswap_vcmla_rot270_f32(__rev0_203, __rev1_203, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_203), __p3_203)})); \
  36823   __ret_203 = __builtin_shufflevector(__ret_203, __ret_203, 1, 0); \
  36824   __ret_203; \
  36825 })
  36826 #endif
  36827 
  36828 #ifdef __LITTLE_ENDIAN__
  36829 #define vcmlaq_rot270_laneq_f32(__p0_204, __p1_204, __p2_204, __p3_204) __extension__ ({ \
  36830   float32x4_t __ret_204; \
  36831   float32x4_t __s0_204 = __p0_204; \
  36832   float32x4_t __s1_204 = __p1_204; \
  36833   float32x4_t __s2_204 = __p2_204; \
  36834   __ret_204 = vcmlaq_rot270_f32(__s0_204, __s1_204, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_204), __p3_204), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_204), __p3_204)})); \
  36835   __ret_204; \
  36836 })
  36837 #else
  36838 #define vcmlaq_rot270_laneq_f32(__p0_205, __p1_205, __p2_205, __p3_205) __extension__ ({ \
  36839   float32x4_t __ret_205; \
  36840   float32x4_t __s0_205 = __p0_205; \
  36841   float32x4_t __s1_205 = __p1_205; \
  36842   float32x4_t __s2_205 = __p2_205; \
  36843   float32x4_t __rev0_205;  __rev0_205 = __builtin_shufflevector(__s0_205, __s0_205, 3, 2, 1, 0); \
  36844   float32x4_t __rev1_205;  __rev1_205 = __builtin_shufflevector(__s1_205, __s1_205, 3, 2, 1, 0); \
  36845   float32x4_t __rev2_205;  __rev2_205 = __builtin_shufflevector(__s2_205, __s2_205, 3, 2, 1, 0); \
  36846   __ret_205 = __noswap_vcmlaq_rot270_f32(__rev0_205, __rev1_205, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_205), __p3_205), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_205), __p3_205)})); \
  36847   __ret_205 = __builtin_shufflevector(__ret_205, __ret_205, 3, 2, 1, 0); \
  36848   __ret_205; \
  36849 })
  36850 #endif
  36851 
  36852 #ifdef __LITTLE_ENDIAN__
  36853 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36854   float32x4_t __ret;
  36855   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36856   return __ret;
  36857 }
  36858 #else
  36859 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36860   float32x4_t __ret;
  36861   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  36862   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  36863   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  36864   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  36865   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  36866   return __ret;
  36867 }
  36868 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  36869   float32x4_t __ret;
  36870   __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  36871   return __ret;
  36872 }
  36873 #endif
  36874 
  36875 #ifdef __LITTLE_ENDIAN__
  36876 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36877   float32x2_t __ret;
  36878   __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36879   return __ret;
  36880 }
  36881 #else
  36882 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36883   float32x2_t __ret;
  36884   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  36885   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  36886   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  36887   __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  36888   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  36889   return __ret;
  36890 }
  36891 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  36892   float32x2_t __ret;
  36893   __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  36894   return __ret;
  36895 }
  36896 #endif
  36897 
  36898 #ifdef __LITTLE_ENDIAN__
  36899 #define vcmla_rot90_lane_f32(__p0_206, __p1_206, __p2_206, __p3_206) __extension__ ({ \
  36900   float32x2_t __ret_206; \
  36901   float32x2_t __s0_206 = __p0_206; \
  36902   float32x2_t __s1_206 = __p1_206; \
  36903   float32x2_t __s2_206 = __p2_206; \
  36904   __ret_206 = vcmla_rot90_f32(__s0_206, __s1_206, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_206), __p3_206)})); \
  36905   __ret_206; \
  36906 })
  36907 #else
  36908 #define vcmla_rot90_lane_f32(__p0_207, __p1_207, __p2_207, __p3_207) __extension__ ({ \
  36909   float32x2_t __ret_207; \
  36910   float32x2_t __s0_207 = __p0_207; \
  36911   float32x2_t __s1_207 = __p1_207; \
  36912   float32x2_t __s2_207 = __p2_207; \
  36913   float32x2_t __rev0_207;  __rev0_207 = __builtin_shufflevector(__s0_207, __s0_207, 1, 0); \
  36914   float32x2_t __rev1_207;  __rev1_207 = __builtin_shufflevector(__s1_207, __s1_207, 1, 0); \
  36915   float32x2_t __rev2_207;  __rev2_207 = __builtin_shufflevector(__s2_207, __s2_207, 1, 0); \
  36916   __ret_207 = __noswap_vcmla_rot90_f32(__rev0_207, __rev1_207, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_207), __p3_207)})); \
  36917   __ret_207 = __builtin_shufflevector(__ret_207, __ret_207, 1, 0); \
  36918   __ret_207; \
  36919 })
  36920 #endif
  36921 
  36922 #ifdef __LITTLE_ENDIAN__
  36923 #define vcmlaq_rot90_lane_f32(__p0_208, __p1_208, __p2_208, __p3_208) __extension__ ({ \
  36924   float32x4_t __ret_208; \
  36925   float32x4_t __s0_208 = __p0_208; \
  36926   float32x4_t __s1_208 = __p1_208; \
  36927   float32x2_t __s2_208 = __p2_208; \
  36928   __ret_208 = vcmlaq_rot90_f32(__s0_208, __s1_208, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_208), __p3_208), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_208), __p3_208)})); \
  36929   __ret_208; \
  36930 })
  36931 #else
  36932 #define vcmlaq_rot90_lane_f32(__p0_209, __p1_209, __p2_209, __p3_209) __extension__ ({ \
  36933   float32x4_t __ret_209; \
  36934   float32x4_t __s0_209 = __p0_209; \
  36935   float32x4_t __s1_209 = __p1_209; \
  36936   float32x2_t __s2_209 = __p2_209; \
  36937   float32x4_t __rev0_209;  __rev0_209 = __builtin_shufflevector(__s0_209, __s0_209, 3, 2, 1, 0); \
  36938   float32x4_t __rev1_209;  __rev1_209 = __builtin_shufflevector(__s1_209, __s1_209, 3, 2, 1, 0); \
  36939   float32x2_t __rev2_209;  __rev2_209 = __builtin_shufflevector(__s2_209, __s2_209, 1, 0); \
  36940   __ret_209 = __noswap_vcmlaq_rot90_f32(__rev0_209, __rev1_209, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_209), __p3_209), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_209), __p3_209)})); \
  36941   __ret_209 = __builtin_shufflevector(__ret_209, __ret_209, 3, 2, 1, 0); \
  36942   __ret_209; \
  36943 })
  36944 #endif
  36945 
  36946 #ifdef __LITTLE_ENDIAN__
  36947 #define vcmla_rot90_laneq_f32(__p0_210, __p1_210, __p2_210, __p3_210) __extension__ ({ \
  36948   float32x2_t __ret_210; \
  36949   float32x2_t __s0_210 = __p0_210; \
  36950   float32x2_t __s1_210 = __p1_210; \
  36951   float32x4_t __s2_210 = __p2_210; \
  36952   __ret_210 = vcmla_rot90_f32(__s0_210, __s1_210, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_210), __p3_210)})); \
  36953   __ret_210; \
  36954 })
  36955 #else
  36956 #define vcmla_rot90_laneq_f32(__p0_211, __p1_211, __p2_211, __p3_211) __extension__ ({ \
  36957   float32x2_t __ret_211; \
  36958   float32x2_t __s0_211 = __p0_211; \
  36959   float32x2_t __s1_211 = __p1_211; \
  36960   float32x4_t __s2_211 = __p2_211; \
  36961   float32x2_t __rev0_211;  __rev0_211 = __builtin_shufflevector(__s0_211, __s0_211, 1, 0); \
  36962   float32x2_t __rev1_211;  __rev1_211 = __builtin_shufflevector(__s1_211, __s1_211, 1, 0); \
  36963   float32x4_t __rev2_211;  __rev2_211 = __builtin_shufflevector(__s2_211, __s2_211, 3, 2, 1, 0); \
  36964   __ret_211 = __noswap_vcmla_rot90_f32(__rev0_211, __rev1_211, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_211), __p3_211)})); \
  36965   __ret_211 = __builtin_shufflevector(__ret_211, __ret_211, 1, 0); \
  36966   __ret_211; \
  36967 })
  36968 #endif
  36969 
  36970 #ifdef __LITTLE_ENDIAN__
  36971 #define vcmlaq_rot90_laneq_f32(__p0_212, __p1_212, __p2_212, __p3_212) __extension__ ({ \
  36972   float32x4_t __ret_212; \
  36973   float32x4_t __s0_212 = __p0_212; \
  36974   float32x4_t __s1_212 = __p1_212; \
  36975   float32x4_t __s2_212 = __p2_212; \
  36976   __ret_212 = vcmlaq_rot90_f32(__s0_212, __s1_212, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_212), __p3_212), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_212), __p3_212)})); \
  36977   __ret_212; \
  36978 })
  36979 #else
  36980 #define vcmlaq_rot90_laneq_f32(__p0_213, __p1_213, __p2_213, __p3_213) __extension__ ({ \
  36981   float32x4_t __ret_213; \
  36982   float32x4_t __s0_213 = __p0_213; \
  36983   float32x4_t __s1_213 = __p1_213; \
  36984   float32x4_t __s2_213 = __p2_213; \
  36985   float32x4_t __rev0_213;  __rev0_213 = __builtin_shufflevector(__s0_213, __s0_213, 3, 2, 1, 0); \
  36986   float32x4_t __rev1_213;  __rev1_213 = __builtin_shufflevector(__s1_213, __s1_213, 3, 2, 1, 0); \
  36987   float32x4_t __rev2_213;  __rev2_213 = __builtin_shufflevector(__s2_213, __s2_213, 3, 2, 1, 0); \
  36988   __ret_213 = __noswap_vcmlaq_rot90_f32(__rev0_213, __rev1_213, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_213), __p3_213), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_213), __p3_213)})); \
  36989   __ret_213 = __builtin_shufflevector(__ret_213, __ret_213, 3, 2, 1, 0); \
  36990   __ret_213; \
  36991 })
  36992 #endif
  36993 
  36994 #if !defined(__aarch64__) && !defined(__arm64ec__)
  36995 #ifdef __LITTLE_ENDIAN__
  36996 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __a32_vcvt_bf16_f32(float32x4_t __p0) {
  36997   bfloat16x4_t __ret;
  36998   __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__p0, 11);
  36999   return __ret;
  37000 }
  37001 #else
  37002 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __a32_vcvt_bf16_f32(float32x4_t __p0) {
  37003   bfloat16x4_t __ret;
  37004   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  37005   __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__rev0, 11);
  37006   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  37007   return __ret;
  37008 }
  37009 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap___a32_vcvt_bf16_f32(float32x4_t __p0) {
  37010   bfloat16x4_t __ret;
  37011   __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__p0, 11);
  37012   return __ret;
  37013 }
  37014 #endif
  37015 
  37016 #ifdef __LITTLE_ENDIAN__
  37017 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) {
  37018   bfloat16x4_t __ret;
  37019   __ret = __a32_vcvt_bf16_f32(__p0);
  37020   return __ret;
  37021 }
  37022 #else
  37023 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) {
  37024   bfloat16x4_t __ret;
  37025   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  37026   __ret = __noswap___a32_vcvt_bf16_f32(__rev0);
  37027   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  37028   return __ret;
  37029 }
  37030 #endif
  37031 
  37032 #ifdef __LITTLE_ENDIAN__
  37033 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) {
  37034   bfloat16x8_t __ret;
  37035   __ret = vcombine_bf16(__a32_vcvt_bf16_f32(__p1), vget_low_bf16(__p0));
  37036   return __ret;
  37037 }
  37038 #else
  37039 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) {
  37040   bfloat16x8_t __ret;
  37041   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  37042   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  37043   __ret = __noswap_vcombine_bf16(__noswap___a32_vcvt_bf16_f32(__rev1), __noswap_vget_low_bf16(__rev0));
  37044   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  37045   return __ret;
  37046 }
  37047 #endif
  37048 
  37049 #ifdef __LITTLE_ENDIAN__
  37050 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) {
  37051   bfloat16x8_t __ret;
  37052   __ret = vcombine_bf16((bfloat16x4_t)(0ULL), __a32_vcvt_bf16_f32(__p0));
  37053   return __ret;
  37054 }
  37055 #else
  37056 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) {
  37057   bfloat16x8_t __ret;
  37058   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  37059   __ret = __noswap_vcombine_bf16((bfloat16x4_t)(0ULL), __noswap___a32_vcvt_bf16_f32(__rev0));
  37060   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  37061   return __ret;
  37062 }
  37063 #endif
  37064 
  37065 __ai __attribute__((target("bf16,neon"))) poly8x8_t vreinterpret_p8_bf16(bfloat16x4_t __p0) {
  37066   poly8x8_t __ret;
  37067   __ret = (poly8x8_t)(__p0);
  37068   return __ret;
  37069 }
  37070 __ai __attribute__((target("bf16,neon"))) poly64x1_t vreinterpret_p64_bf16(bfloat16x4_t __p0) {
  37071   poly64x1_t __ret;
  37072   __ret = (poly64x1_t)(__p0);
  37073   return __ret;
  37074 }
  37075 __ai __attribute__((target("bf16,neon"))) poly16x4_t vreinterpret_p16_bf16(bfloat16x4_t __p0) {
  37076   poly16x4_t __ret;
  37077   __ret = (poly16x4_t)(__p0);
  37078   return __ret;
  37079 }
  37080 __ai __attribute__((target("bf16,neon"))) poly8x16_t vreinterpretq_p8_bf16(bfloat16x8_t __p0) {
  37081   poly8x16_t __ret;
  37082   __ret = (poly8x16_t)(__p0);
  37083   return __ret;
  37084 }
  37085 __ai __attribute__((target("bf16,neon"))) poly64x2_t vreinterpretq_p64_bf16(bfloat16x8_t __p0) {
  37086   poly64x2_t __ret;
  37087   __ret = (poly64x2_t)(__p0);
  37088   return __ret;
  37089 }
  37090 __ai __attribute__((target("bf16,neon"))) poly16x8_t vreinterpretq_p16_bf16(bfloat16x8_t __p0) {
  37091   poly16x8_t __ret;
  37092   __ret = (poly16x8_t)(__p0);
  37093   return __ret;
  37094 }
  37095 __ai __attribute__((target("bf16,neon"))) uint8x16_t vreinterpretq_u8_bf16(bfloat16x8_t __p0) {
  37096   uint8x16_t __ret;
  37097   __ret = (uint8x16_t)(__p0);
  37098   return __ret;
  37099 }
  37100 __ai __attribute__((target("bf16,neon"))) uint32x4_t vreinterpretq_u32_bf16(bfloat16x8_t __p0) {
  37101   uint32x4_t __ret;
  37102   __ret = (uint32x4_t)(__p0);
  37103   return __ret;
  37104 }
  37105 __ai __attribute__((target("bf16,neon"))) uint64x2_t vreinterpretq_u64_bf16(bfloat16x8_t __p0) {
  37106   uint64x2_t __ret;
  37107   __ret = (uint64x2_t)(__p0);
  37108   return __ret;
  37109 }
  37110 __ai __attribute__((target("bf16,neon"))) uint16x8_t vreinterpretq_u16_bf16(bfloat16x8_t __p0) {
  37111   uint16x8_t __ret;
  37112   __ret = (uint16x8_t)(__p0);
  37113   return __ret;
  37114 }
  37115 __ai __attribute__((target("bf16,neon"))) int8x16_t vreinterpretq_s8_bf16(bfloat16x8_t __p0) {
  37116   int8x16_t __ret;
  37117   __ret = (int8x16_t)(__p0);
  37118   return __ret;
  37119 }
  37120 __ai __attribute__((target("bf16,neon"))) float32x4_t vreinterpretq_f32_bf16(bfloat16x8_t __p0) {
  37121   float32x4_t __ret;
  37122   __ret = (float32x4_t)(__p0);
  37123   return __ret;
  37124 }
  37125 __ai __attribute__((target("bf16,neon"))) float16x8_t vreinterpretq_f16_bf16(bfloat16x8_t __p0) {
  37126   float16x8_t __ret;
  37127   __ret = (float16x8_t)(__p0);
  37128   return __ret;
  37129 }
  37130 __ai __attribute__((target("bf16,neon"))) int32x4_t vreinterpretq_s32_bf16(bfloat16x8_t __p0) {
  37131   int32x4_t __ret;
  37132   __ret = (int32x4_t)(__p0);
  37133   return __ret;
  37134 }
  37135 __ai __attribute__((target("bf16,neon"))) int64x2_t vreinterpretq_s64_bf16(bfloat16x8_t __p0) {
  37136   int64x2_t __ret;
  37137   __ret = (int64x2_t)(__p0);
  37138   return __ret;
  37139 }
  37140 __ai __attribute__((target("bf16,neon"))) int16x8_t vreinterpretq_s16_bf16(bfloat16x8_t __p0) {
  37141   int16x8_t __ret;
  37142   __ret = (int16x8_t)(__p0);
  37143   return __ret;
  37144 }
  37145 __ai __attribute__((target("bf16,neon"))) uint8x8_t vreinterpret_u8_bf16(bfloat16x4_t __p0) {
  37146   uint8x8_t __ret;
  37147   __ret = (uint8x8_t)(__p0);
  37148   return __ret;
  37149 }
  37150 __ai __attribute__((target("bf16,neon"))) uint32x2_t vreinterpret_u32_bf16(bfloat16x4_t __p0) {
  37151   uint32x2_t __ret;
  37152   __ret = (uint32x2_t)(__p0);
  37153   return __ret;
  37154 }
  37155 __ai __attribute__((target("bf16,neon"))) uint64x1_t vreinterpret_u64_bf16(bfloat16x4_t __p0) {
  37156   uint64x1_t __ret;
  37157   __ret = (uint64x1_t)(__p0);
  37158   return __ret;
  37159 }
  37160 __ai __attribute__((target("bf16,neon"))) uint16x4_t vreinterpret_u16_bf16(bfloat16x4_t __p0) {
  37161   uint16x4_t __ret;
  37162   __ret = (uint16x4_t)(__p0);
  37163   return __ret;
  37164 }
  37165 __ai __attribute__((target("bf16,neon"))) int8x8_t vreinterpret_s8_bf16(bfloat16x4_t __p0) {
  37166   int8x8_t __ret;
  37167   __ret = (int8x8_t)(__p0);
  37168   return __ret;
  37169 }
  37170 __ai __attribute__((target("bf16,neon"))) float32x2_t vreinterpret_f32_bf16(bfloat16x4_t __p0) {
  37171   float32x2_t __ret;
  37172   __ret = (float32x2_t)(__p0);
  37173   return __ret;
  37174 }
  37175 __ai __attribute__((target("bf16,neon"))) float16x4_t vreinterpret_f16_bf16(bfloat16x4_t __p0) {
  37176   float16x4_t __ret;
  37177   __ret = (float16x4_t)(__p0);
  37178   return __ret;
  37179 }
  37180 __ai __attribute__((target("bf16,neon"))) int32x2_t vreinterpret_s32_bf16(bfloat16x4_t __p0) {
  37181   int32x2_t __ret;
  37182   __ret = (int32x2_t)(__p0);
  37183   return __ret;
  37184 }
  37185 __ai __attribute__((target("bf16,neon"))) int64x1_t vreinterpret_s64_bf16(bfloat16x4_t __p0) {
  37186   int64x1_t __ret;
  37187   __ret = (int64x1_t)(__p0);
  37188   return __ret;
  37189 }
  37190 __ai __attribute__((target("bf16,neon"))) int16x4_t vreinterpret_s16_bf16(bfloat16x4_t __p0) {
  37191   int16x4_t __ret;
  37192   __ret = (int16x4_t)(__p0);
  37193   return __ret;
  37194 }
  37195 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p8(poly8x16_t __p0) {
  37196   bfloat16x8_t __ret;
  37197   __ret = (bfloat16x8_t)(__p0);
  37198   return __ret;
  37199 }
  37200 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p64(poly64x2_t __p0) {
  37201   bfloat16x8_t __ret;
  37202   __ret = (bfloat16x8_t)(__p0);
  37203   return __ret;
  37204 }
  37205 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p16(poly16x8_t __p0) {
  37206   bfloat16x8_t __ret;
  37207   __ret = (bfloat16x8_t)(__p0);
  37208   return __ret;
  37209 }
  37210 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u8(uint8x16_t __p0) {
  37211   bfloat16x8_t __ret;
  37212   __ret = (bfloat16x8_t)(__p0);
  37213   return __ret;
  37214 }
  37215 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u32(uint32x4_t __p0) {
  37216   bfloat16x8_t __ret;
  37217   __ret = (bfloat16x8_t)(__p0);
  37218   return __ret;
  37219 }
  37220 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u64(uint64x2_t __p0) {
  37221   bfloat16x8_t __ret;
  37222   __ret = (bfloat16x8_t)(__p0);
  37223   return __ret;
  37224 }
  37225 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u16(uint16x8_t __p0) {
  37226   bfloat16x8_t __ret;
  37227   __ret = (bfloat16x8_t)(__p0);
  37228   return __ret;
  37229 }
  37230 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s8(int8x16_t __p0) {
  37231   bfloat16x8_t __ret;
  37232   __ret = (bfloat16x8_t)(__p0);
  37233   return __ret;
  37234 }
  37235 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f32(float32x4_t __p0) {
  37236   bfloat16x8_t __ret;
  37237   __ret = (bfloat16x8_t)(__p0);
  37238   return __ret;
  37239 }
  37240 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f16(float16x8_t __p0) {
  37241   bfloat16x8_t __ret;
  37242   __ret = (bfloat16x8_t)(__p0);
  37243   return __ret;
  37244 }
  37245 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s32(int32x4_t __p0) {
  37246   bfloat16x8_t __ret;
  37247   __ret = (bfloat16x8_t)(__p0);
  37248   return __ret;
  37249 }
  37250 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s64(int64x2_t __p0) {
  37251   bfloat16x8_t __ret;
  37252   __ret = (bfloat16x8_t)(__p0);
  37253   return __ret;
  37254 }
  37255 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s16(int16x8_t __p0) {
  37256   bfloat16x8_t __ret;
  37257   __ret = (bfloat16x8_t)(__p0);
  37258   return __ret;
  37259 }
  37260 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p8(poly8x8_t __p0) {
  37261   bfloat16x4_t __ret;
  37262   __ret = (bfloat16x4_t)(__p0);
  37263   return __ret;
  37264 }
  37265 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p64(poly64x1_t __p0) {
  37266   bfloat16x4_t __ret;
  37267   __ret = (bfloat16x4_t)(__p0);
  37268   return __ret;
  37269 }
  37270 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p16(poly16x4_t __p0) {
  37271   bfloat16x4_t __ret;
  37272   __ret = (bfloat16x4_t)(__p0);
  37273   return __ret;
  37274 }
  37275 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u8(uint8x8_t __p0) {
  37276   bfloat16x4_t __ret;
  37277   __ret = (bfloat16x4_t)(__p0);
  37278   return __ret;
  37279 }
  37280 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u32(uint32x2_t __p0) {
  37281   bfloat16x4_t __ret;
  37282   __ret = (bfloat16x4_t)(__p0);
  37283   return __ret;
  37284 }
  37285 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u64(uint64x1_t __p0) {
  37286   bfloat16x4_t __ret;
  37287   __ret = (bfloat16x4_t)(__p0);
  37288   return __ret;
  37289 }
  37290 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u16(uint16x4_t __p0) {
  37291   bfloat16x4_t __ret;
  37292   __ret = (bfloat16x4_t)(__p0);
  37293   return __ret;
  37294 }
  37295 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s8(int8x8_t __p0) {
  37296   bfloat16x4_t __ret;
  37297   __ret = (bfloat16x4_t)(__p0);
  37298   return __ret;
  37299 }
  37300 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f32(float32x2_t __p0) {
  37301   bfloat16x4_t __ret;
  37302   __ret = (bfloat16x4_t)(__p0);
  37303   return __ret;
  37304 }
  37305 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f16(float16x4_t __p0) {
  37306   bfloat16x4_t __ret;
  37307   __ret = (bfloat16x4_t)(__p0);
  37308   return __ret;
  37309 }
  37310 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s32(int32x2_t __p0) {
  37311   bfloat16x4_t __ret;
  37312   __ret = (bfloat16x4_t)(__p0);
  37313   return __ret;
  37314 }
  37315 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s64(int64x1_t __p0) {
  37316   bfloat16x4_t __ret;
  37317   __ret = (bfloat16x4_t)(__p0);
  37318   return __ret;
  37319 }
  37320 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s16(int16x4_t __p0) {
  37321   bfloat16x4_t __ret;
  37322   __ret = (bfloat16x4_t)(__p0);
  37323   return __ret;
  37324 }
  37325 #ifdef __LITTLE_ENDIAN__
  37326 #define vqdmulhq_lane_s32(__p0_214, __p1_214, __p2_214) __extension__ ({ \
  37327   int32x4_t __ret_214; \
  37328   int32x4_t __s0_214 = __p0_214; \
  37329   int32x2_t __s1_214 = __p1_214; \
  37330   __ret_214 = vqdmulhq_s32(__s0_214, splatq_lane_s32(__s1_214, __p2_214)); \
  37331   __ret_214; \
  37332 })
  37333 #else
  37334 #define vqdmulhq_lane_s32(__p0_215, __p1_215, __p2_215) __extension__ ({ \
  37335   int32x4_t __ret_215; \
  37336   int32x4_t __s0_215 = __p0_215; \
  37337   int32x2_t __s1_215 = __p1_215; \
  37338   int32x4_t __rev0_215;  __rev0_215 = __builtin_shufflevector(__s0_215, __s0_215, 3, 2, 1, 0); \
  37339   int32x2_t __rev1_215;  __rev1_215 = __builtin_shufflevector(__s1_215, __s1_215, 1, 0); \
  37340   __ret_215 = __noswap_vqdmulhq_s32(__rev0_215, __noswap_splatq_lane_s32(__rev1_215, __p2_215)); \
  37341   __ret_215 = __builtin_shufflevector(__ret_215, __ret_215, 3, 2, 1, 0); \
  37342   __ret_215; \
  37343 })
  37344 #endif
  37345 
  37346 #ifdef __LITTLE_ENDIAN__
  37347 #define vqdmulhq_lane_s16(__p0_216, __p1_216, __p2_216) __extension__ ({ \
  37348   int16x8_t __ret_216; \
  37349   int16x8_t __s0_216 = __p0_216; \
  37350   int16x4_t __s1_216 = __p1_216; \
  37351   __ret_216 = vqdmulhq_s16(__s0_216, splatq_lane_s16(__s1_216, __p2_216)); \
  37352   __ret_216; \
  37353 })
  37354 #else
  37355 #define vqdmulhq_lane_s16(__p0_217, __p1_217, __p2_217) __extension__ ({ \
  37356   int16x8_t __ret_217; \
  37357   int16x8_t __s0_217 = __p0_217; \
  37358   int16x4_t __s1_217 = __p1_217; \
  37359   int16x8_t __rev0_217;  __rev0_217 = __builtin_shufflevector(__s0_217, __s0_217, 7, 6, 5, 4, 3, 2, 1, 0); \
  37360   int16x4_t __rev1_217;  __rev1_217 = __builtin_shufflevector(__s1_217, __s1_217, 3, 2, 1, 0); \
  37361   __ret_217 = __noswap_vqdmulhq_s16(__rev0_217, __noswap_splatq_lane_s16(__rev1_217, __p2_217)); \
  37362   __ret_217 = __builtin_shufflevector(__ret_217, __ret_217, 7, 6, 5, 4, 3, 2, 1, 0); \
  37363   __ret_217; \
  37364 })
  37365 #endif
  37366 
  37367 #ifdef __LITTLE_ENDIAN__
  37368 #define vqdmulh_lane_s32(__p0_218, __p1_218, __p2_218) __extension__ ({ \
  37369   int32x2_t __ret_218; \
  37370   int32x2_t __s0_218 = __p0_218; \
  37371   int32x2_t __s1_218 = __p1_218; \
  37372   __ret_218 = vqdmulh_s32(__s0_218, splat_lane_s32(__s1_218, __p2_218)); \
  37373   __ret_218; \
  37374 })
  37375 #else
  37376 #define vqdmulh_lane_s32(__p0_219, __p1_219, __p2_219) __extension__ ({ \
  37377   int32x2_t __ret_219; \
  37378   int32x2_t __s0_219 = __p0_219; \
  37379   int32x2_t __s1_219 = __p1_219; \
  37380   int32x2_t __rev0_219;  __rev0_219 = __builtin_shufflevector(__s0_219, __s0_219, 1, 0); \
  37381   int32x2_t __rev1_219;  __rev1_219 = __builtin_shufflevector(__s1_219, __s1_219, 1, 0); \
  37382   __ret_219 = __noswap_vqdmulh_s32(__rev0_219, __noswap_splat_lane_s32(__rev1_219, __p2_219)); \
  37383   __ret_219 = __builtin_shufflevector(__ret_219, __ret_219, 1, 0); \
  37384   __ret_219; \
  37385 })
  37386 #endif
  37387 
  37388 #ifdef __LITTLE_ENDIAN__
  37389 #define vqdmulh_lane_s16(__p0_220, __p1_220, __p2_220) __extension__ ({ \
  37390   int16x4_t __ret_220; \
  37391   int16x4_t __s0_220 = __p0_220; \
  37392   int16x4_t __s1_220 = __p1_220; \
  37393   __ret_220 = vqdmulh_s16(__s0_220, splat_lane_s16(__s1_220, __p2_220)); \
  37394   __ret_220; \
  37395 })
  37396 #else
  37397 #define vqdmulh_lane_s16(__p0_221, __p1_221, __p2_221) __extension__ ({ \
  37398   int16x4_t __ret_221; \
  37399   int16x4_t __s0_221 = __p0_221; \
  37400   int16x4_t __s1_221 = __p1_221; \
  37401   int16x4_t __rev0_221;  __rev0_221 = __builtin_shufflevector(__s0_221, __s0_221, 3, 2, 1, 0); \
  37402   int16x4_t __rev1_221;  __rev1_221 = __builtin_shufflevector(__s1_221, __s1_221, 3, 2, 1, 0); \
  37403   __ret_221 = __noswap_vqdmulh_s16(__rev0_221, __noswap_splat_lane_s16(__rev1_221, __p2_221)); \
  37404   __ret_221 = __builtin_shufflevector(__ret_221, __ret_221, 3, 2, 1, 0); \
  37405   __ret_221; \
  37406 })
  37407 #endif
  37408 
  37409 #ifdef __LITTLE_ENDIAN__
  37410 #define vqrdmulhq_lane_s32(__p0_222, __p1_222, __p2_222) __extension__ ({ \
  37411   int32x4_t __ret_222; \
  37412   int32x4_t __s0_222 = __p0_222; \
  37413   int32x2_t __s1_222 = __p1_222; \
  37414   __ret_222 = vqrdmulhq_s32(__s0_222, splatq_lane_s32(__s1_222, __p2_222)); \
  37415   __ret_222; \
  37416 })
  37417 #else
  37418 #define vqrdmulhq_lane_s32(__p0_223, __p1_223, __p2_223) __extension__ ({ \
  37419   int32x4_t __ret_223; \
  37420   int32x4_t __s0_223 = __p0_223; \
  37421   int32x2_t __s1_223 = __p1_223; \
  37422   int32x4_t __rev0_223;  __rev0_223 = __builtin_shufflevector(__s0_223, __s0_223, 3, 2, 1, 0); \
  37423   int32x2_t __rev1_223;  __rev1_223 = __builtin_shufflevector(__s1_223, __s1_223, 1, 0); \
  37424   __ret_223 = __noswap_vqrdmulhq_s32(__rev0_223, __noswap_splatq_lane_s32(__rev1_223, __p2_223)); \
  37425   __ret_223 = __builtin_shufflevector(__ret_223, __ret_223, 3, 2, 1, 0); \
  37426   __ret_223; \
  37427 })
  37428 #endif
  37429 
  37430 #ifdef __LITTLE_ENDIAN__
  37431 #define vqrdmulhq_lane_s16(__p0_224, __p1_224, __p2_224) __extension__ ({ \
  37432   int16x8_t __ret_224; \
  37433   int16x8_t __s0_224 = __p0_224; \
  37434   int16x4_t __s1_224 = __p1_224; \
  37435   __ret_224 = vqrdmulhq_s16(__s0_224, splatq_lane_s16(__s1_224, __p2_224)); \
  37436   __ret_224; \
  37437 })
  37438 #else
  37439 #define vqrdmulhq_lane_s16(__p0_225, __p1_225, __p2_225) __extension__ ({ \
  37440   int16x8_t __ret_225; \
  37441   int16x8_t __s0_225 = __p0_225; \
  37442   int16x4_t __s1_225 = __p1_225; \
  37443   int16x8_t __rev0_225;  __rev0_225 = __builtin_shufflevector(__s0_225, __s0_225, 7, 6, 5, 4, 3, 2, 1, 0); \
  37444   int16x4_t __rev1_225;  __rev1_225 = __builtin_shufflevector(__s1_225, __s1_225, 3, 2, 1, 0); \
  37445   __ret_225 = __noswap_vqrdmulhq_s16(__rev0_225, __noswap_splatq_lane_s16(__rev1_225, __p2_225)); \
  37446   __ret_225 = __builtin_shufflevector(__ret_225, __ret_225, 7, 6, 5, 4, 3, 2, 1, 0); \
  37447   __ret_225; \
  37448 })
  37449 #endif
  37450 
  37451 #ifdef __LITTLE_ENDIAN__
  37452 #define vqrdmulh_lane_s32(__p0_226, __p1_226, __p2_226) __extension__ ({ \
  37453   int32x2_t __ret_226; \
  37454   int32x2_t __s0_226 = __p0_226; \
  37455   int32x2_t __s1_226 = __p1_226; \
  37456   __ret_226 = vqrdmulh_s32(__s0_226, splat_lane_s32(__s1_226, __p2_226)); \
  37457   __ret_226; \
  37458 })
  37459 #else
  37460 #define vqrdmulh_lane_s32(__p0_227, __p1_227, __p2_227) __extension__ ({ \
  37461   int32x2_t __ret_227; \
  37462   int32x2_t __s0_227 = __p0_227; \
  37463   int32x2_t __s1_227 = __p1_227; \
  37464   int32x2_t __rev0_227;  __rev0_227 = __builtin_shufflevector(__s0_227, __s0_227, 1, 0); \
  37465   int32x2_t __rev1_227;  __rev1_227 = __builtin_shufflevector(__s1_227, __s1_227, 1, 0); \
  37466   __ret_227 = __noswap_vqrdmulh_s32(__rev0_227, __noswap_splat_lane_s32(__rev1_227, __p2_227)); \
  37467   __ret_227 = __builtin_shufflevector(__ret_227, __ret_227, 1, 0); \
  37468   __ret_227; \
  37469 })
  37470 #endif
  37471 
  37472 #ifdef __LITTLE_ENDIAN__
  37473 #define vqrdmulh_lane_s16(__p0_228, __p1_228, __p2_228) __extension__ ({ \
  37474   int16x4_t __ret_228; \
  37475   int16x4_t __s0_228 = __p0_228; \
  37476   int16x4_t __s1_228 = __p1_228; \
  37477   __ret_228 = vqrdmulh_s16(__s0_228, splat_lane_s16(__s1_228, __p2_228)); \
  37478   __ret_228; \
  37479 })
  37480 #else
  37481 #define vqrdmulh_lane_s16(__p0_229, __p1_229, __p2_229) __extension__ ({ \
  37482   int16x4_t __ret_229; \
  37483   int16x4_t __s0_229 = __p0_229; \
  37484   int16x4_t __s1_229 = __p1_229; \
  37485   int16x4_t __rev0_229;  __rev0_229 = __builtin_shufflevector(__s0_229, __s0_229, 3, 2, 1, 0); \
  37486   int16x4_t __rev1_229;  __rev1_229 = __builtin_shufflevector(__s1_229, __s1_229, 3, 2, 1, 0); \
  37487   __ret_229 = __noswap_vqrdmulh_s16(__rev0_229, __noswap_splat_lane_s16(__rev1_229, __p2_229)); \
  37488   __ret_229 = __builtin_shufflevector(__ret_229, __ret_229, 3, 2, 1, 0); \
  37489   __ret_229; \
  37490 })
  37491 #endif
  37492 
  37493 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p16(poly16x4_t __p0) {
  37494   poly8x8_t __ret;
  37495   __ret = (poly8x8_t)(__p0);
  37496   return __ret;
  37497 }
  37498 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u8(uint8x8_t __p0) {
  37499   poly8x8_t __ret;
  37500   __ret = (poly8x8_t)(__p0);
  37501   return __ret;
  37502 }
  37503 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u32(uint32x2_t __p0) {
  37504   poly8x8_t __ret;
  37505   __ret = (poly8x8_t)(__p0);
  37506   return __ret;
  37507 }
  37508 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u64(uint64x1_t __p0) {
  37509   poly8x8_t __ret;
  37510   __ret = (poly8x8_t)(__p0);
  37511   return __ret;
  37512 }
  37513 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u16(uint16x4_t __p0) {
  37514   poly8x8_t __ret;
  37515   __ret = (poly8x8_t)(__p0);
  37516   return __ret;
  37517 }
  37518 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s8(int8x8_t __p0) {
  37519   poly8x8_t __ret;
  37520   __ret = (poly8x8_t)(__p0);
  37521   return __ret;
  37522 }
  37523 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f32(float32x2_t __p0) {
  37524   poly8x8_t __ret;
  37525   __ret = (poly8x8_t)(__p0);
  37526   return __ret;
  37527 }
  37528 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f16(float16x4_t __p0) {
  37529   poly8x8_t __ret;
  37530   __ret = (poly8x8_t)(__p0);
  37531   return __ret;
  37532 }
  37533 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s32(int32x2_t __p0) {
  37534   poly8x8_t __ret;
  37535   __ret = (poly8x8_t)(__p0);
  37536   return __ret;
  37537 }
  37538 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s64(int64x1_t __p0) {
  37539   poly8x8_t __ret;
  37540   __ret = (poly8x8_t)(__p0);
  37541   return __ret;
  37542 }
  37543 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s16(int16x4_t __p0) {
  37544   poly8x8_t __ret;
  37545   __ret = (poly8x8_t)(__p0);
  37546   return __ret;
  37547 }
  37548 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p8(poly8x8_t __p0) {
  37549   poly16x4_t __ret;
  37550   __ret = (poly16x4_t)(__p0);
  37551   return __ret;
  37552 }
  37553 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u8(uint8x8_t __p0) {
  37554   poly16x4_t __ret;
  37555   __ret = (poly16x4_t)(__p0);
  37556   return __ret;
  37557 }
  37558 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u32(uint32x2_t __p0) {
  37559   poly16x4_t __ret;
  37560   __ret = (poly16x4_t)(__p0);
  37561   return __ret;
  37562 }
  37563 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u64(uint64x1_t __p0) {
  37564   poly16x4_t __ret;
  37565   __ret = (poly16x4_t)(__p0);
  37566   return __ret;
  37567 }
  37568 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u16(uint16x4_t __p0) {
  37569   poly16x4_t __ret;
  37570   __ret = (poly16x4_t)(__p0);
  37571   return __ret;
  37572 }
  37573 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s8(int8x8_t __p0) {
  37574   poly16x4_t __ret;
  37575   __ret = (poly16x4_t)(__p0);
  37576   return __ret;
  37577 }
  37578 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f32(float32x2_t __p0) {
  37579   poly16x4_t __ret;
  37580   __ret = (poly16x4_t)(__p0);
  37581   return __ret;
  37582 }
  37583 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f16(float16x4_t __p0) {
  37584   poly16x4_t __ret;
  37585   __ret = (poly16x4_t)(__p0);
  37586   return __ret;
  37587 }
  37588 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s32(int32x2_t __p0) {
  37589   poly16x4_t __ret;
  37590   __ret = (poly16x4_t)(__p0);
  37591   return __ret;
  37592 }
  37593 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s64(int64x1_t __p0) {
  37594   poly16x4_t __ret;
  37595   __ret = (poly16x4_t)(__p0);
  37596   return __ret;
  37597 }
  37598 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s16(int16x4_t __p0) {
  37599   poly16x4_t __ret;
  37600   __ret = (poly16x4_t)(__p0);
  37601   return __ret;
  37602 }
  37603 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p16(poly16x8_t __p0) {
  37604   poly8x16_t __ret;
  37605   __ret = (poly8x16_t)(__p0);
  37606   return __ret;
  37607 }
  37608 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u8(uint8x16_t __p0) {
  37609   poly8x16_t __ret;
  37610   __ret = (poly8x16_t)(__p0);
  37611   return __ret;
  37612 }
  37613 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u32(uint32x4_t __p0) {
  37614   poly8x16_t __ret;
  37615   __ret = (poly8x16_t)(__p0);
  37616   return __ret;
  37617 }
  37618 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u64(uint64x2_t __p0) {
  37619   poly8x16_t __ret;
  37620   __ret = (poly8x16_t)(__p0);
  37621   return __ret;
  37622 }
  37623 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u16(uint16x8_t __p0) {
  37624   poly8x16_t __ret;
  37625   __ret = (poly8x16_t)(__p0);
  37626   return __ret;
  37627 }
  37628 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s8(int8x16_t __p0) {
  37629   poly8x16_t __ret;
  37630   __ret = (poly8x16_t)(__p0);
  37631   return __ret;
  37632 }
  37633 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f32(float32x4_t __p0) {
  37634   poly8x16_t __ret;
  37635   __ret = (poly8x16_t)(__p0);
  37636   return __ret;
  37637 }
  37638 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f16(float16x8_t __p0) {
  37639   poly8x16_t __ret;
  37640   __ret = (poly8x16_t)(__p0);
  37641   return __ret;
  37642 }
  37643 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s32(int32x4_t __p0) {
  37644   poly8x16_t __ret;
  37645   __ret = (poly8x16_t)(__p0);
  37646   return __ret;
  37647 }
  37648 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s64(int64x2_t __p0) {
  37649   poly8x16_t __ret;
  37650   __ret = (poly8x16_t)(__p0);
  37651   return __ret;
  37652 }
  37653 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s16(int16x8_t __p0) {
  37654   poly8x16_t __ret;
  37655   __ret = (poly8x16_t)(__p0);
  37656   return __ret;
  37657 }
  37658 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p8(poly8x16_t __p0) {
  37659   poly16x8_t __ret;
  37660   __ret = (poly16x8_t)(__p0);
  37661   return __ret;
  37662 }
  37663 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u8(uint8x16_t __p0) {
  37664   poly16x8_t __ret;
  37665   __ret = (poly16x8_t)(__p0);
  37666   return __ret;
  37667 }
  37668 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u32(uint32x4_t __p0) {
  37669   poly16x8_t __ret;
  37670   __ret = (poly16x8_t)(__p0);
  37671   return __ret;
  37672 }
  37673 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u64(uint64x2_t __p0) {
  37674   poly16x8_t __ret;
  37675   __ret = (poly16x8_t)(__p0);
  37676   return __ret;
  37677 }
  37678 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u16(uint16x8_t __p0) {
  37679   poly16x8_t __ret;
  37680   __ret = (poly16x8_t)(__p0);
  37681   return __ret;
  37682 }
  37683 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s8(int8x16_t __p0) {
  37684   poly16x8_t __ret;
  37685   __ret = (poly16x8_t)(__p0);
  37686   return __ret;
  37687 }
  37688 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f32(float32x4_t __p0) {
  37689   poly16x8_t __ret;
  37690   __ret = (poly16x8_t)(__p0);
  37691   return __ret;
  37692 }
  37693 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f16(float16x8_t __p0) {
  37694   poly16x8_t __ret;
  37695   __ret = (poly16x8_t)(__p0);
  37696   return __ret;
  37697 }
  37698 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s32(int32x4_t __p0) {
  37699   poly16x8_t __ret;
  37700   __ret = (poly16x8_t)(__p0);
  37701   return __ret;
  37702 }
  37703 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s64(int64x2_t __p0) {
  37704   poly16x8_t __ret;
  37705   __ret = (poly16x8_t)(__p0);
  37706   return __ret;
  37707 }
  37708 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s16(int16x8_t __p0) {
  37709   poly16x8_t __ret;
  37710   __ret = (poly16x8_t)(__p0);
  37711   return __ret;
  37712 }
  37713 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p8(poly8x16_t __p0) {
  37714   uint8x16_t __ret;
  37715   __ret = (uint8x16_t)(__p0);
  37716   return __ret;
  37717 }
  37718 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p16(poly16x8_t __p0) {
  37719   uint8x16_t __ret;
  37720   __ret = (uint8x16_t)(__p0);
  37721   return __ret;
  37722 }
  37723 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u32(uint32x4_t __p0) {
  37724   uint8x16_t __ret;
  37725   __ret = (uint8x16_t)(__p0);
  37726   return __ret;
  37727 }
  37728 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u64(uint64x2_t __p0) {
  37729   uint8x16_t __ret;
  37730   __ret = (uint8x16_t)(__p0);
  37731   return __ret;
  37732 }
  37733 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u16(uint16x8_t __p0) {
  37734   uint8x16_t __ret;
  37735   __ret = (uint8x16_t)(__p0);
  37736   return __ret;
  37737 }
  37738 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s8(int8x16_t __p0) {
  37739   uint8x16_t __ret;
  37740   __ret = (uint8x16_t)(__p0);
  37741   return __ret;
  37742 }
  37743 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f32(float32x4_t __p0) {
  37744   uint8x16_t __ret;
  37745   __ret = (uint8x16_t)(__p0);
  37746   return __ret;
  37747 }
  37748 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f16(float16x8_t __p0) {
  37749   uint8x16_t __ret;
  37750   __ret = (uint8x16_t)(__p0);
  37751   return __ret;
  37752 }
  37753 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s32(int32x4_t __p0) {
  37754   uint8x16_t __ret;
  37755   __ret = (uint8x16_t)(__p0);
  37756   return __ret;
  37757 }
  37758 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s64(int64x2_t __p0) {
  37759   uint8x16_t __ret;
  37760   __ret = (uint8x16_t)(__p0);
  37761   return __ret;
  37762 }
  37763 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s16(int16x8_t __p0) {
  37764   uint8x16_t __ret;
  37765   __ret = (uint8x16_t)(__p0);
  37766   return __ret;
  37767 }
  37768 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p8(poly8x16_t __p0) {
  37769   uint32x4_t __ret;
  37770   __ret = (uint32x4_t)(__p0);
  37771   return __ret;
  37772 }
  37773 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p16(poly16x8_t __p0) {
  37774   uint32x4_t __ret;
  37775   __ret = (uint32x4_t)(__p0);
  37776   return __ret;
  37777 }
  37778 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u8(uint8x16_t __p0) {
  37779   uint32x4_t __ret;
  37780   __ret = (uint32x4_t)(__p0);
  37781   return __ret;
  37782 }
  37783 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u64(uint64x2_t __p0) {
  37784   uint32x4_t __ret;
  37785   __ret = (uint32x4_t)(__p0);
  37786   return __ret;
  37787 }
  37788 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u16(uint16x8_t __p0) {
  37789   uint32x4_t __ret;
  37790   __ret = (uint32x4_t)(__p0);
  37791   return __ret;
  37792 }
  37793 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s8(int8x16_t __p0) {
  37794   uint32x4_t __ret;
  37795   __ret = (uint32x4_t)(__p0);
  37796   return __ret;
  37797 }
  37798 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f32(float32x4_t __p0) {
  37799   uint32x4_t __ret;
  37800   __ret = (uint32x4_t)(__p0);
  37801   return __ret;
  37802 }
  37803 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f16(float16x8_t __p0) {
  37804   uint32x4_t __ret;
  37805   __ret = (uint32x4_t)(__p0);
  37806   return __ret;
  37807 }
  37808 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s32(int32x4_t __p0) {
  37809   uint32x4_t __ret;
  37810   __ret = (uint32x4_t)(__p0);
  37811   return __ret;
  37812 }
  37813 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s64(int64x2_t __p0) {
  37814   uint32x4_t __ret;
  37815   __ret = (uint32x4_t)(__p0);
  37816   return __ret;
  37817 }
  37818 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s16(int16x8_t __p0) {
  37819   uint32x4_t __ret;
  37820   __ret = (uint32x4_t)(__p0);
  37821   return __ret;
  37822 }
  37823 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p8(poly8x16_t __p0) {
  37824   uint64x2_t __ret;
  37825   __ret = (uint64x2_t)(__p0);
  37826   return __ret;
  37827 }
  37828 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p16(poly16x8_t __p0) {
  37829   uint64x2_t __ret;
  37830   __ret = (uint64x2_t)(__p0);
  37831   return __ret;
  37832 }
  37833 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u8(uint8x16_t __p0) {
  37834   uint64x2_t __ret;
  37835   __ret = (uint64x2_t)(__p0);
  37836   return __ret;
  37837 }
  37838 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u32(uint32x4_t __p0) {
  37839   uint64x2_t __ret;
  37840   __ret = (uint64x2_t)(__p0);
  37841   return __ret;
  37842 }
  37843 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u16(uint16x8_t __p0) {
  37844   uint64x2_t __ret;
  37845   __ret = (uint64x2_t)(__p0);
  37846   return __ret;
  37847 }
  37848 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s8(int8x16_t __p0) {
  37849   uint64x2_t __ret;
  37850   __ret = (uint64x2_t)(__p0);
  37851   return __ret;
  37852 }
  37853 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f32(float32x4_t __p0) {
  37854   uint64x2_t __ret;
  37855   __ret = (uint64x2_t)(__p0);
  37856   return __ret;
  37857 }
  37858 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f16(float16x8_t __p0) {
  37859   uint64x2_t __ret;
  37860   __ret = (uint64x2_t)(__p0);
  37861   return __ret;
  37862 }
  37863 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s32(int32x4_t __p0) {
  37864   uint64x2_t __ret;
  37865   __ret = (uint64x2_t)(__p0);
  37866   return __ret;
  37867 }
  37868 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s64(int64x2_t __p0) {
  37869   uint64x2_t __ret;
  37870   __ret = (uint64x2_t)(__p0);
  37871   return __ret;
  37872 }
  37873 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s16(int16x8_t __p0) {
  37874   uint64x2_t __ret;
  37875   __ret = (uint64x2_t)(__p0);
  37876   return __ret;
  37877 }
  37878 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p8(poly8x16_t __p0) {
  37879   uint16x8_t __ret;
  37880   __ret = (uint16x8_t)(__p0);
  37881   return __ret;
  37882 }
  37883 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p16(poly16x8_t __p0) {
  37884   uint16x8_t __ret;
  37885   __ret = (uint16x8_t)(__p0);
  37886   return __ret;
  37887 }
  37888 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u8(uint8x16_t __p0) {
  37889   uint16x8_t __ret;
  37890   __ret = (uint16x8_t)(__p0);
  37891   return __ret;
  37892 }
  37893 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u32(uint32x4_t __p0) {
  37894   uint16x8_t __ret;
  37895   __ret = (uint16x8_t)(__p0);
  37896   return __ret;
  37897 }
  37898 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u64(uint64x2_t __p0) {
  37899   uint16x8_t __ret;
  37900   __ret = (uint16x8_t)(__p0);
  37901   return __ret;
  37902 }
  37903 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s8(int8x16_t __p0) {
  37904   uint16x8_t __ret;
  37905   __ret = (uint16x8_t)(__p0);
  37906   return __ret;
  37907 }
  37908 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f32(float32x4_t __p0) {
  37909   uint16x8_t __ret;
  37910   __ret = (uint16x8_t)(__p0);
  37911   return __ret;
  37912 }
  37913 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f16(float16x8_t __p0) {
  37914   uint16x8_t __ret;
  37915   __ret = (uint16x8_t)(__p0);
  37916   return __ret;
  37917 }
  37918 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s32(int32x4_t __p0) {
  37919   uint16x8_t __ret;
  37920   __ret = (uint16x8_t)(__p0);
  37921   return __ret;
  37922 }
  37923 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s64(int64x2_t __p0) {
  37924   uint16x8_t __ret;
  37925   __ret = (uint16x8_t)(__p0);
  37926   return __ret;
  37927 }
  37928 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s16(int16x8_t __p0) {
  37929   uint16x8_t __ret;
  37930   __ret = (uint16x8_t)(__p0);
  37931   return __ret;
  37932 }
  37933 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p8(poly8x16_t __p0) {
  37934   int8x16_t __ret;
  37935   __ret = (int8x16_t)(__p0);
  37936   return __ret;
  37937 }
  37938 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p16(poly16x8_t __p0) {
  37939   int8x16_t __ret;
  37940   __ret = (int8x16_t)(__p0);
  37941   return __ret;
  37942 }
  37943 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u8(uint8x16_t __p0) {
  37944   int8x16_t __ret;
  37945   __ret = (int8x16_t)(__p0);
  37946   return __ret;
  37947 }
  37948 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u32(uint32x4_t __p0) {
  37949   int8x16_t __ret;
  37950   __ret = (int8x16_t)(__p0);
  37951   return __ret;
  37952 }
  37953 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u64(uint64x2_t __p0) {
  37954   int8x16_t __ret;
  37955   __ret = (int8x16_t)(__p0);
  37956   return __ret;
  37957 }
  37958 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u16(uint16x8_t __p0) {
  37959   int8x16_t __ret;
  37960   __ret = (int8x16_t)(__p0);
  37961   return __ret;
  37962 }
  37963 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f32(float32x4_t __p0) {
  37964   int8x16_t __ret;
  37965   __ret = (int8x16_t)(__p0);
  37966   return __ret;
  37967 }
  37968 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f16(float16x8_t __p0) {
  37969   int8x16_t __ret;
  37970   __ret = (int8x16_t)(__p0);
  37971   return __ret;
  37972 }
  37973 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s32(int32x4_t __p0) {
  37974   int8x16_t __ret;
  37975   __ret = (int8x16_t)(__p0);
  37976   return __ret;
  37977 }
  37978 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s64(int64x2_t __p0) {
  37979   int8x16_t __ret;
  37980   __ret = (int8x16_t)(__p0);
  37981   return __ret;
  37982 }
  37983 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s16(int16x8_t __p0) {
  37984   int8x16_t __ret;
  37985   __ret = (int8x16_t)(__p0);
  37986   return __ret;
  37987 }
  37988 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p8(poly8x16_t __p0) {
  37989   float32x4_t __ret;
  37990   __ret = (float32x4_t)(__p0);
  37991   return __ret;
  37992 }
  37993 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p16(poly16x8_t __p0) {
  37994   float32x4_t __ret;
  37995   __ret = (float32x4_t)(__p0);
  37996   return __ret;
  37997 }
  37998 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u8(uint8x16_t __p0) {
  37999   float32x4_t __ret;
  38000   __ret = (float32x4_t)(__p0);
  38001   return __ret;
  38002 }
  38003 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u32(uint32x4_t __p0) {
  38004   float32x4_t __ret;
  38005   __ret = (float32x4_t)(__p0);
  38006   return __ret;
  38007 }
  38008 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u64(uint64x2_t __p0) {
  38009   float32x4_t __ret;
  38010   __ret = (float32x4_t)(__p0);
  38011   return __ret;
  38012 }
  38013 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u16(uint16x8_t __p0) {
  38014   float32x4_t __ret;
  38015   __ret = (float32x4_t)(__p0);
  38016   return __ret;
  38017 }
  38018 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s8(int8x16_t __p0) {
  38019   float32x4_t __ret;
  38020   __ret = (float32x4_t)(__p0);
  38021   return __ret;
  38022 }
  38023 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_f16(float16x8_t __p0) {
  38024   float32x4_t __ret;
  38025   __ret = (float32x4_t)(__p0);
  38026   return __ret;
  38027 }
  38028 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s32(int32x4_t __p0) {
  38029   float32x4_t __ret;
  38030   __ret = (float32x4_t)(__p0);
  38031   return __ret;
  38032 }
  38033 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s64(int64x2_t __p0) {
  38034   float32x4_t __ret;
  38035   __ret = (float32x4_t)(__p0);
  38036   return __ret;
  38037 }
  38038 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s16(int16x8_t __p0) {
  38039   float32x4_t __ret;
  38040   __ret = (float32x4_t)(__p0);
  38041   return __ret;
  38042 }
  38043 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p8(poly8x16_t __p0) {
  38044   float16x8_t __ret;
  38045   __ret = (float16x8_t)(__p0);
  38046   return __ret;
  38047 }
  38048 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p16(poly16x8_t __p0) {
  38049   float16x8_t __ret;
  38050   __ret = (float16x8_t)(__p0);
  38051   return __ret;
  38052 }
  38053 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u8(uint8x16_t __p0) {
  38054   float16x8_t __ret;
  38055   __ret = (float16x8_t)(__p0);
  38056   return __ret;
  38057 }
  38058 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u32(uint32x4_t __p0) {
  38059   float16x8_t __ret;
  38060   __ret = (float16x8_t)(__p0);
  38061   return __ret;
  38062 }
  38063 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u64(uint64x2_t __p0) {
  38064   float16x8_t __ret;
  38065   __ret = (float16x8_t)(__p0);
  38066   return __ret;
  38067 }
  38068 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u16(uint16x8_t __p0) {
  38069   float16x8_t __ret;
  38070   __ret = (float16x8_t)(__p0);
  38071   return __ret;
  38072 }
  38073 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s8(int8x16_t __p0) {
  38074   float16x8_t __ret;
  38075   __ret = (float16x8_t)(__p0);
  38076   return __ret;
  38077 }
  38078 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f32(float32x4_t __p0) {
  38079   float16x8_t __ret;
  38080   __ret = (float16x8_t)(__p0);
  38081   return __ret;
  38082 }
  38083 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s32(int32x4_t __p0) {
  38084   float16x8_t __ret;
  38085   __ret = (float16x8_t)(__p0);
  38086   return __ret;
  38087 }
  38088 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s64(int64x2_t __p0) {
  38089   float16x8_t __ret;
  38090   __ret = (float16x8_t)(__p0);
  38091   return __ret;
  38092 }
  38093 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s16(int16x8_t __p0) {
  38094   float16x8_t __ret;
  38095   __ret = (float16x8_t)(__p0);
  38096   return __ret;
  38097 }
  38098 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p8(poly8x16_t __p0) {
  38099   int32x4_t __ret;
  38100   __ret = (int32x4_t)(__p0);
  38101   return __ret;
  38102 }
  38103 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p16(poly16x8_t __p0) {
  38104   int32x4_t __ret;
  38105   __ret = (int32x4_t)(__p0);
  38106   return __ret;
  38107 }
  38108 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u8(uint8x16_t __p0) {
  38109   int32x4_t __ret;
  38110   __ret = (int32x4_t)(__p0);
  38111   return __ret;
  38112 }
  38113 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u32(uint32x4_t __p0) {
  38114   int32x4_t __ret;
  38115   __ret = (int32x4_t)(__p0);
  38116   return __ret;
  38117 }
  38118 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u64(uint64x2_t __p0) {
  38119   int32x4_t __ret;
  38120   __ret = (int32x4_t)(__p0);
  38121   return __ret;
  38122 }
  38123 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u16(uint16x8_t __p0) {
  38124   int32x4_t __ret;
  38125   __ret = (int32x4_t)(__p0);
  38126   return __ret;
  38127 }
  38128 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s8(int8x16_t __p0) {
  38129   int32x4_t __ret;
  38130   __ret = (int32x4_t)(__p0);
  38131   return __ret;
  38132 }
  38133 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f32(float32x4_t __p0) {
  38134   int32x4_t __ret;
  38135   __ret = (int32x4_t)(__p0);
  38136   return __ret;
  38137 }
  38138 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f16(float16x8_t __p0) {
  38139   int32x4_t __ret;
  38140   __ret = (int32x4_t)(__p0);
  38141   return __ret;
  38142 }
  38143 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s64(int64x2_t __p0) {
  38144   int32x4_t __ret;
  38145   __ret = (int32x4_t)(__p0);
  38146   return __ret;
  38147 }
  38148 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s16(int16x8_t __p0) {
  38149   int32x4_t __ret;
  38150   __ret = (int32x4_t)(__p0);
  38151   return __ret;
  38152 }
  38153 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p8(poly8x16_t __p0) {
  38154   int64x2_t __ret;
  38155   __ret = (int64x2_t)(__p0);
  38156   return __ret;
  38157 }
  38158 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p16(poly16x8_t __p0) {
  38159   int64x2_t __ret;
  38160   __ret = (int64x2_t)(__p0);
  38161   return __ret;
  38162 }
  38163 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u8(uint8x16_t __p0) {
  38164   int64x2_t __ret;
  38165   __ret = (int64x2_t)(__p0);
  38166   return __ret;
  38167 }
  38168 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u32(uint32x4_t __p0) {
  38169   int64x2_t __ret;
  38170   __ret = (int64x2_t)(__p0);
  38171   return __ret;
  38172 }
  38173 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u64(uint64x2_t __p0) {
  38174   int64x2_t __ret;
  38175   __ret = (int64x2_t)(__p0);
  38176   return __ret;
  38177 }
  38178 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u16(uint16x8_t __p0) {
  38179   int64x2_t __ret;
  38180   __ret = (int64x2_t)(__p0);
  38181   return __ret;
  38182 }
  38183 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s8(int8x16_t __p0) {
  38184   int64x2_t __ret;
  38185   __ret = (int64x2_t)(__p0);
  38186   return __ret;
  38187 }
  38188 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f32(float32x4_t __p0) {
  38189   int64x2_t __ret;
  38190   __ret = (int64x2_t)(__p0);
  38191   return __ret;
  38192 }
  38193 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f16(float16x8_t __p0) {
  38194   int64x2_t __ret;
  38195   __ret = (int64x2_t)(__p0);
  38196   return __ret;
  38197 }
  38198 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s32(int32x4_t __p0) {
  38199   int64x2_t __ret;
  38200   __ret = (int64x2_t)(__p0);
  38201   return __ret;
  38202 }
  38203 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s16(int16x8_t __p0) {
  38204   int64x2_t __ret;
  38205   __ret = (int64x2_t)(__p0);
  38206   return __ret;
  38207 }
  38208 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p8(poly8x16_t __p0) {
  38209   int16x8_t __ret;
  38210   __ret = (int16x8_t)(__p0);
  38211   return __ret;
  38212 }
  38213 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p16(poly16x8_t __p0) {
  38214   int16x8_t __ret;
  38215   __ret = (int16x8_t)(__p0);
  38216   return __ret;
  38217 }
  38218 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u8(uint8x16_t __p0) {
  38219   int16x8_t __ret;
  38220   __ret = (int16x8_t)(__p0);
  38221   return __ret;
  38222 }
  38223 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u32(uint32x4_t __p0) {
  38224   int16x8_t __ret;
  38225   __ret = (int16x8_t)(__p0);
  38226   return __ret;
  38227 }
  38228 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u64(uint64x2_t __p0) {
  38229   int16x8_t __ret;
  38230   __ret = (int16x8_t)(__p0);
  38231   return __ret;
  38232 }
  38233 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u16(uint16x8_t __p0) {
  38234   int16x8_t __ret;
  38235   __ret = (int16x8_t)(__p0);
  38236   return __ret;
  38237 }
  38238 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s8(int8x16_t __p0) {
  38239   int16x8_t __ret;
  38240   __ret = (int16x8_t)(__p0);
  38241   return __ret;
  38242 }
  38243 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f32(float32x4_t __p0) {
  38244   int16x8_t __ret;
  38245   __ret = (int16x8_t)(__p0);
  38246   return __ret;
  38247 }
  38248 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f16(float16x8_t __p0) {
  38249   int16x8_t __ret;
  38250   __ret = (int16x8_t)(__p0);
  38251   return __ret;
  38252 }
  38253 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s32(int32x4_t __p0) {
  38254   int16x8_t __ret;
  38255   __ret = (int16x8_t)(__p0);
  38256   return __ret;
  38257 }
  38258 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s64(int64x2_t __p0) {
  38259   int16x8_t __ret;
  38260   __ret = (int16x8_t)(__p0);
  38261   return __ret;
  38262 }
  38263 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p8(poly8x8_t __p0) {
  38264   uint8x8_t __ret;
  38265   __ret = (uint8x8_t)(__p0);
  38266   return __ret;
  38267 }
  38268 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p16(poly16x4_t __p0) {
  38269   uint8x8_t __ret;
  38270   __ret = (uint8x8_t)(__p0);
  38271   return __ret;
  38272 }
  38273 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u32(uint32x2_t __p0) {
  38274   uint8x8_t __ret;
  38275   __ret = (uint8x8_t)(__p0);
  38276   return __ret;
  38277 }
  38278 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u64(uint64x1_t __p0) {
  38279   uint8x8_t __ret;
  38280   __ret = (uint8x8_t)(__p0);
  38281   return __ret;
  38282 }
  38283 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u16(uint16x4_t __p0) {
  38284   uint8x8_t __ret;
  38285   __ret = (uint8x8_t)(__p0);
  38286   return __ret;
  38287 }
  38288 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s8(int8x8_t __p0) {
  38289   uint8x8_t __ret;
  38290   __ret = (uint8x8_t)(__p0);
  38291   return __ret;
  38292 }
  38293 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f32(float32x2_t __p0) {
  38294   uint8x8_t __ret;
  38295   __ret = (uint8x8_t)(__p0);
  38296   return __ret;
  38297 }
  38298 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f16(float16x4_t __p0) {
  38299   uint8x8_t __ret;
  38300   __ret = (uint8x8_t)(__p0);
  38301   return __ret;
  38302 }
  38303 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s32(int32x2_t __p0) {
  38304   uint8x8_t __ret;
  38305   __ret = (uint8x8_t)(__p0);
  38306   return __ret;
  38307 }
  38308 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s64(int64x1_t __p0) {
  38309   uint8x8_t __ret;
  38310   __ret = (uint8x8_t)(__p0);
  38311   return __ret;
  38312 }
  38313 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s16(int16x4_t __p0) {
  38314   uint8x8_t __ret;
  38315   __ret = (uint8x8_t)(__p0);
  38316   return __ret;
  38317 }
  38318 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p8(poly8x8_t __p0) {
  38319   uint32x2_t __ret;
  38320   __ret = (uint32x2_t)(__p0);
  38321   return __ret;
  38322 }
  38323 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p16(poly16x4_t __p0) {
  38324   uint32x2_t __ret;
  38325   __ret = (uint32x2_t)(__p0);
  38326   return __ret;
  38327 }
  38328 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u8(uint8x8_t __p0) {
  38329   uint32x2_t __ret;
  38330   __ret = (uint32x2_t)(__p0);
  38331   return __ret;
  38332 }
  38333 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u64(uint64x1_t __p0) {
  38334   uint32x2_t __ret;
  38335   __ret = (uint32x2_t)(__p0);
  38336   return __ret;
  38337 }
  38338 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u16(uint16x4_t __p0) {
  38339   uint32x2_t __ret;
  38340   __ret = (uint32x2_t)(__p0);
  38341   return __ret;
  38342 }
  38343 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s8(int8x8_t __p0) {
  38344   uint32x2_t __ret;
  38345   __ret = (uint32x2_t)(__p0);
  38346   return __ret;
  38347 }
  38348 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f32(float32x2_t __p0) {
  38349   uint32x2_t __ret;
  38350   __ret = (uint32x2_t)(__p0);
  38351   return __ret;
  38352 }
  38353 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f16(float16x4_t __p0) {
  38354   uint32x2_t __ret;
  38355   __ret = (uint32x2_t)(__p0);
  38356   return __ret;
  38357 }
  38358 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s32(int32x2_t __p0) {
  38359   uint32x2_t __ret;
  38360   __ret = (uint32x2_t)(__p0);
  38361   return __ret;
  38362 }
  38363 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s64(int64x1_t __p0) {
  38364   uint32x2_t __ret;
  38365   __ret = (uint32x2_t)(__p0);
  38366   return __ret;
  38367 }
  38368 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s16(int16x4_t __p0) {
  38369   uint32x2_t __ret;
  38370   __ret = (uint32x2_t)(__p0);
  38371   return __ret;
  38372 }
  38373 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p8(poly8x8_t __p0) {
  38374   uint64x1_t __ret;
  38375   __ret = (uint64x1_t)(__p0);
  38376   return __ret;
  38377 }
  38378 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p16(poly16x4_t __p0) {
  38379   uint64x1_t __ret;
  38380   __ret = (uint64x1_t)(__p0);
  38381   return __ret;
  38382 }
  38383 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u8(uint8x8_t __p0) {
  38384   uint64x1_t __ret;
  38385   __ret = (uint64x1_t)(__p0);
  38386   return __ret;
  38387 }
  38388 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u32(uint32x2_t __p0) {
  38389   uint64x1_t __ret;
  38390   __ret = (uint64x1_t)(__p0);
  38391   return __ret;
  38392 }
  38393 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u16(uint16x4_t __p0) {
  38394   uint64x1_t __ret;
  38395   __ret = (uint64x1_t)(__p0);
  38396   return __ret;
  38397 }
  38398 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s8(int8x8_t __p0) {
  38399   uint64x1_t __ret;
  38400   __ret = (uint64x1_t)(__p0);
  38401   return __ret;
  38402 }
  38403 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f32(float32x2_t __p0) {
  38404   uint64x1_t __ret;
  38405   __ret = (uint64x1_t)(__p0);
  38406   return __ret;
  38407 }
  38408 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f16(float16x4_t __p0) {
  38409   uint64x1_t __ret;
  38410   __ret = (uint64x1_t)(__p0);
  38411   return __ret;
  38412 }
  38413 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s32(int32x2_t __p0) {
  38414   uint64x1_t __ret;
  38415   __ret = (uint64x1_t)(__p0);
  38416   return __ret;
  38417 }
  38418 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s64(int64x1_t __p0) {
  38419   uint64x1_t __ret;
  38420   __ret = (uint64x1_t)(__p0);
  38421   return __ret;
  38422 }
  38423 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s16(int16x4_t __p0) {
  38424   uint64x1_t __ret;
  38425   __ret = (uint64x1_t)(__p0);
  38426   return __ret;
  38427 }
  38428 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p8(poly8x8_t __p0) {
  38429   uint16x4_t __ret;
  38430   __ret = (uint16x4_t)(__p0);
  38431   return __ret;
  38432 }
  38433 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p16(poly16x4_t __p0) {
  38434   uint16x4_t __ret;
  38435   __ret = (uint16x4_t)(__p0);
  38436   return __ret;
  38437 }
  38438 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u8(uint8x8_t __p0) {
  38439   uint16x4_t __ret;
  38440   __ret = (uint16x4_t)(__p0);
  38441   return __ret;
  38442 }
  38443 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u32(uint32x2_t __p0) {
  38444   uint16x4_t __ret;
  38445   __ret = (uint16x4_t)(__p0);
  38446   return __ret;
  38447 }
  38448 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u64(uint64x1_t __p0) {
  38449   uint16x4_t __ret;
  38450   __ret = (uint16x4_t)(__p0);
  38451   return __ret;
  38452 }
  38453 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s8(int8x8_t __p0) {
  38454   uint16x4_t __ret;
  38455   __ret = (uint16x4_t)(__p0);
  38456   return __ret;
  38457 }
  38458 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f32(float32x2_t __p0) {
  38459   uint16x4_t __ret;
  38460   __ret = (uint16x4_t)(__p0);
  38461   return __ret;
  38462 }
  38463 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f16(float16x4_t __p0) {
  38464   uint16x4_t __ret;
  38465   __ret = (uint16x4_t)(__p0);
  38466   return __ret;
  38467 }
  38468 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s32(int32x2_t __p0) {
  38469   uint16x4_t __ret;
  38470   __ret = (uint16x4_t)(__p0);
  38471   return __ret;
  38472 }
  38473 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s64(int64x1_t __p0) {
  38474   uint16x4_t __ret;
  38475   __ret = (uint16x4_t)(__p0);
  38476   return __ret;
  38477 }
  38478 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s16(int16x4_t __p0) {
  38479   uint16x4_t __ret;
  38480   __ret = (uint16x4_t)(__p0);
  38481   return __ret;
  38482 }
  38483 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p8(poly8x8_t __p0) {
  38484   int8x8_t __ret;
  38485   __ret = (int8x8_t)(__p0);
  38486   return __ret;
  38487 }
  38488 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p16(poly16x4_t __p0) {
  38489   int8x8_t __ret;
  38490   __ret = (int8x8_t)(__p0);
  38491   return __ret;
  38492 }
  38493 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u8(uint8x8_t __p0) {
  38494   int8x8_t __ret;
  38495   __ret = (int8x8_t)(__p0);
  38496   return __ret;
  38497 }
  38498 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u32(uint32x2_t __p0) {
  38499   int8x8_t __ret;
  38500   __ret = (int8x8_t)(__p0);
  38501   return __ret;
  38502 }
  38503 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u64(uint64x1_t __p0) {
  38504   int8x8_t __ret;
  38505   __ret = (int8x8_t)(__p0);
  38506   return __ret;
  38507 }
  38508 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u16(uint16x4_t __p0) {
  38509   int8x8_t __ret;
  38510   __ret = (int8x8_t)(__p0);
  38511   return __ret;
  38512 }
  38513 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f32(float32x2_t __p0) {
  38514   int8x8_t __ret;
  38515   __ret = (int8x8_t)(__p0);
  38516   return __ret;
  38517 }
  38518 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f16(float16x4_t __p0) {
  38519   int8x8_t __ret;
  38520   __ret = (int8x8_t)(__p0);
  38521   return __ret;
  38522 }
  38523 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s32(int32x2_t __p0) {
  38524   int8x8_t __ret;
  38525   __ret = (int8x8_t)(__p0);
  38526   return __ret;
  38527 }
  38528 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s64(int64x1_t __p0) {
  38529   int8x8_t __ret;
  38530   __ret = (int8x8_t)(__p0);
  38531   return __ret;
  38532 }
  38533 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s16(int16x4_t __p0) {
  38534   int8x8_t __ret;
  38535   __ret = (int8x8_t)(__p0);
  38536   return __ret;
  38537 }
  38538 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p8(poly8x8_t __p0) {
  38539   float32x2_t __ret;
  38540   __ret = (float32x2_t)(__p0);
  38541   return __ret;
  38542 }
  38543 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p16(poly16x4_t __p0) {
  38544   float32x2_t __ret;
  38545   __ret = (float32x2_t)(__p0);
  38546   return __ret;
  38547 }
  38548 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u8(uint8x8_t __p0) {
  38549   float32x2_t __ret;
  38550   __ret = (float32x2_t)(__p0);
  38551   return __ret;
  38552 }
  38553 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u32(uint32x2_t __p0) {
  38554   float32x2_t __ret;
  38555   __ret = (float32x2_t)(__p0);
  38556   return __ret;
  38557 }
  38558 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u64(uint64x1_t __p0) {
  38559   float32x2_t __ret;
  38560   __ret = (float32x2_t)(__p0);
  38561   return __ret;
  38562 }
  38563 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u16(uint16x4_t __p0) {
  38564   float32x2_t __ret;
  38565   __ret = (float32x2_t)(__p0);
  38566   return __ret;
  38567 }
  38568 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s8(int8x8_t __p0) {
  38569   float32x2_t __ret;
  38570   __ret = (float32x2_t)(__p0);
  38571   return __ret;
  38572 }
  38573 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f16(float16x4_t __p0) {
  38574   float32x2_t __ret;
  38575   __ret = (float32x2_t)(__p0);
  38576   return __ret;
  38577 }
  38578 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s32(int32x2_t __p0) {
  38579   float32x2_t __ret;
  38580   __ret = (float32x2_t)(__p0);
  38581   return __ret;
  38582 }
  38583 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s64(int64x1_t __p0) {
  38584   float32x2_t __ret;
  38585   __ret = (float32x2_t)(__p0);
  38586   return __ret;
  38587 }
  38588 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s16(int16x4_t __p0) {
  38589   float32x2_t __ret;
  38590   __ret = (float32x2_t)(__p0);
  38591   return __ret;
  38592 }
  38593 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p8(poly8x8_t __p0) {
  38594   float16x4_t __ret;
  38595   __ret = (float16x4_t)(__p0);
  38596   return __ret;
  38597 }
  38598 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p16(poly16x4_t __p0) {
  38599   float16x4_t __ret;
  38600   __ret = (float16x4_t)(__p0);
  38601   return __ret;
  38602 }
  38603 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u8(uint8x8_t __p0) {
  38604   float16x4_t __ret;
  38605   __ret = (float16x4_t)(__p0);
  38606   return __ret;
  38607 }
  38608 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u32(uint32x2_t __p0) {
  38609   float16x4_t __ret;
  38610   __ret = (float16x4_t)(__p0);
  38611   return __ret;
  38612 }
  38613 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u64(uint64x1_t __p0) {
  38614   float16x4_t __ret;
  38615   __ret = (float16x4_t)(__p0);
  38616   return __ret;
  38617 }
  38618 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u16(uint16x4_t __p0) {
  38619   float16x4_t __ret;
  38620   __ret = (float16x4_t)(__p0);
  38621   return __ret;
  38622 }
  38623 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s8(int8x8_t __p0) {
  38624   float16x4_t __ret;
  38625   __ret = (float16x4_t)(__p0);
  38626   return __ret;
  38627 }
  38628 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f32(float32x2_t __p0) {
  38629   float16x4_t __ret;
  38630   __ret = (float16x4_t)(__p0);
  38631   return __ret;
  38632 }
  38633 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s32(int32x2_t __p0) {
  38634   float16x4_t __ret;
  38635   __ret = (float16x4_t)(__p0);
  38636   return __ret;
  38637 }
  38638 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s64(int64x1_t __p0) {
  38639   float16x4_t __ret;
  38640   __ret = (float16x4_t)(__p0);
  38641   return __ret;
  38642 }
  38643 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s16(int16x4_t __p0) {
  38644   float16x4_t __ret;
  38645   __ret = (float16x4_t)(__p0);
  38646   return __ret;
  38647 }
  38648 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p8(poly8x8_t __p0) {
  38649   int32x2_t __ret;
  38650   __ret = (int32x2_t)(__p0);
  38651   return __ret;
  38652 }
  38653 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p16(poly16x4_t __p0) {
  38654   int32x2_t __ret;
  38655   __ret = (int32x2_t)(__p0);
  38656   return __ret;
  38657 }
  38658 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u8(uint8x8_t __p0) {
  38659   int32x2_t __ret;
  38660   __ret = (int32x2_t)(__p0);
  38661   return __ret;
  38662 }
  38663 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u32(uint32x2_t __p0) {
  38664   int32x2_t __ret;
  38665   __ret = (int32x2_t)(__p0);
  38666   return __ret;
  38667 }
  38668 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u64(uint64x1_t __p0) {
  38669   int32x2_t __ret;
  38670   __ret = (int32x2_t)(__p0);
  38671   return __ret;
  38672 }
  38673 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u16(uint16x4_t __p0) {
  38674   int32x2_t __ret;
  38675   __ret = (int32x2_t)(__p0);
  38676   return __ret;
  38677 }
  38678 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s8(int8x8_t __p0) {
  38679   int32x2_t __ret;
  38680   __ret = (int32x2_t)(__p0);
  38681   return __ret;
  38682 }
  38683 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f32(float32x2_t __p0) {
  38684   int32x2_t __ret;
  38685   __ret = (int32x2_t)(__p0);
  38686   return __ret;
  38687 }
  38688 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f16(float16x4_t __p0) {
  38689   int32x2_t __ret;
  38690   __ret = (int32x2_t)(__p0);
  38691   return __ret;
  38692 }
  38693 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s64(int64x1_t __p0) {
  38694   int32x2_t __ret;
  38695   __ret = (int32x2_t)(__p0);
  38696   return __ret;
  38697 }
  38698 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s16(int16x4_t __p0) {
  38699   int32x2_t __ret;
  38700   __ret = (int32x2_t)(__p0);
  38701   return __ret;
  38702 }
  38703 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p8(poly8x8_t __p0) {
  38704   int64x1_t __ret;
  38705   __ret = (int64x1_t)(__p0);
  38706   return __ret;
  38707 }
  38708 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p16(poly16x4_t __p0) {
  38709   int64x1_t __ret;
  38710   __ret = (int64x1_t)(__p0);
  38711   return __ret;
  38712 }
  38713 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u8(uint8x8_t __p0) {
  38714   int64x1_t __ret;
  38715   __ret = (int64x1_t)(__p0);
  38716   return __ret;
  38717 }
  38718 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u32(uint32x2_t __p0) {
  38719   int64x1_t __ret;
  38720   __ret = (int64x1_t)(__p0);
  38721   return __ret;
  38722 }
  38723 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u64(uint64x1_t __p0) {
  38724   int64x1_t __ret;
  38725   __ret = (int64x1_t)(__p0);
  38726   return __ret;
  38727 }
  38728 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u16(uint16x4_t __p0) {
  38729   int64x1_t __ret;
  38730   __ret = (int64x1_t)(__p0);
  38731   return __ret;
  38732 }
  38733 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s8(int8x8_t __p0) {
  38734   int64x1_t __ret;
  38735   __ret = (int64x1_t)(__p0);
  38736   return __ret;
  38737 }
  38738 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f32(float32x2_t __p0) {
  38739   int64x1_t __ret;
  38740   __ret = (int64x1_t)(__p0);
  38741   return __ret;
  38742 }
  38743 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f16(float16x4_t __p0) {
  38744   int64x1_t __ret;
  38745   __ret = (int64x1_t)(__p0);
  38746   return __ret;
  38747 }
  38748 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s32(int32x2_t __p0) {
  38749   int64x1_t __ret;
  38750   __ret = (int64x1_t)(__p0);
  38751   return __ret;
  38752 }
  38753 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s16(int16x4_t __p0) {
  38754   int64x1_t __ret;
  38755   __ret = (int64x1_t)(__p0);
  38756   return __ret;
  38757 }
  38758 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p8(poly8x8_t __p0) {
  38759   int16x4_t __ret;
  38760   __ret = (int16x4_t)(__p0);
  38761   return __ret;
  38762 }
  38763 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p16(poly16x4_t __p0) {
  38764   int16x4_t __ret;
  38765   __ret = (int16x4_t)(__p0);
  38766   return __ret;
  38767 }
  38768 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u8(uint8x8_t __p0) {
  38769   int16x4_t __ret;
  38770   __ret = (int16x4_t)(__p0);
  38771   return __ret;
  38772 }
  38773 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u32(uint32x2_t __p0) {
  38774   int16x4_t __ret;
  38775   __ret = (int16x4_t)(__p0);
  38776   return __ret;
  38777 }
  38778 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u64(uint64x1_t __p0) {
  38779   int16x4_t __ret;
  38780   __ret = (int16x4_t)(__p0);
  38781   return __ret;
  38782 }
  38783 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u16(uint16x4_t __p0) {
  38784   int16x4_t __ret;
  38785   __ret = (int16x4_t)(__p0);
  38786   return __ret;
  38787 }
  38788 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s8(int8x8_t __p0) {
  38789   int16x4_t __ret;
  38790   __ret = (int16x4_t)(__p0);
  38791   return __ret;
  38792 }
  38793 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f32(float32x2_t __p0) {
  38794   int16x4_t __ret;
  38795   __ret = (int16x4_t)(__p0);
  38796   return __ret;
  38797 }
  38798 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f16(float16x4_t __p0) {
  38799   int16x4_t __ret;
  38800   __ret = (int16x4_t)(__p0);
  38801   return __ret;
  38802 }
  38803 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s32(int32x2_t __p0) {
  38804   int16x4_t __ret;
  38805   __ret = (int16x4_t)(__p0);
  38806   return __ret;
  38807 }
  38808 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s64(int64x1_t __p0) {
  38809   int16x4_t __ret;
  38810   __ret = (int16x4_t)(__p0);
  38811   return __ret;
  38812 }
  38813 #endif
  38814 #if (__ARM_FP & 2)
  38815 #ifdef __LITTLE_ENDIAN__
  38816 __ai __attribute__((target("neon"))) float16x4_t vcvt_f16_f32(float32x4_t __p0) {
  38817   float16x4_t __ret;
  38818   __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__p0, 41);
  38819   return __ret;
  38820 }
  38821 #else
  38822 __ai __attribute__((target("neon"))) float16x4_t vcvt_f16_f32(float32x4_t __p0) {
  38823   float16x4_t __ret;
  38824   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  38825   __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__rev0, 41);
  38826   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  38827   return __ret;
  38828 }
  38829 __ai __attribute__((target("neon"))) float16x4_t __noswap_vcvt_f16_f32(float32x4_t __p0) {
  38830   float16x4_t __ret;
  38831   __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__p0, 41);
  38832   return __ret;
  38833 }
  38834 #endif
  38835 
  38836 #ifdef __LITTLE_ENDIAN__
  38837 __ai __attribute__((target("neon"))) float32x4_t vcvt_f32_f16(float16x4_t __p0) {
  38838   float32x4_t __ret;
  38839   __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__p0, 8);
  38840   return __ret;
  38841 }
  38842 #else
  38843 __ai __attribute__((target("neon"))) float32x4_t vcvt_f32_f16(float16x4_t __p0) {
  38844   float32x4_t __ret;
  38845   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  38846   __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__rev0, 8);
  38847   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  38848   return __ret;
  38849 }
  38850 __ai __attribute__((target("neon"))) float32x4_t __noswap_vcvt_f32_f16(float16x4_t __p0) {
  38851   float32x4_t __ret;
  38852   __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__p0, 8);
  38853   return __ret;
  38854 }
  38855 #endif
  38856 
  38857 #ifdef __LITTLE_ENDIAN__
  38858 #define vld1q_f16(__p0) __extension__ ({ \
  38859   float16x8_t __ret; \
  38860   __ret = (float16x8_t) __builtin_neon_vld1q_v(__p0, 40); \
  38861   __ret; \
  38862 })
  38863 #else
  38864 #define vld1q_f16(__p0) __extension__ ({ \
  38865   float16x8_t __ret; \
  38866   __ret = (float16x8_t) __builtin_neon_vld1q_v(__p0, 40); \
  38867   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  38868   __ret; \
  38869 })
  38870 #endif
  38871 
  38872 #ifdef __LITTLE_ENDIAN__
  38873 #define vld1_f16(__p0) __extension__ ({ \
  38874   float16x4_t __ret; \
  38875   __ret = (float16x4_t) __builtin_neon_vld1_v(__p0, 8); \
  38876   __ret; \
  38877 })
  38878 #else
  38879 #define vld1_f16(__p0) __extension__ ({ \
  38880   float16x4_t __ret; \
  38881   __ret = (float16x4_t) __builtin_neon_vld1_v(__p0, 8); \
  38882   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  38883   __ret; \
  38884 })
  38885 #endif
  38886 
  38887 #ifdef __LITTLE_ENDIAN__
  38888 #define vld1q_dup_f16(__p0) __extension__ ({ \
  38889   float16x8_t __ret; \
  38890   __ret = (float16x8_t) __builtin_neon_vld1q_dup_v(__p0, 40); \
  38891   __ret; \
  38892 })
  38893 #else
  38894 #define vld1q_dup_f16(__p0) __extension__ ({ \
  38895   float16x8_t __ret; \
  38896   __ret = (float16x8_t) __builtin_neon_vld1q_dup_v(__p0, 40); \
  38897   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  38898   __ret; \
  38899 })
  38900 #endif
  38901 /* vld1_dup_f16(__p0): statement-expression macro whose value is the float16x4_t
         * produced by __builtin_neon_vld1_dup_v(__p0, 8).  When __LITTLE_ENDIAN__ is
         * not defined, the four lanes of the result are reversed before it is yielded.
         * NOTE(review): 8 is presumably the builtin's float16x4 type code -- confirm. */
  38902 #ifdef __LITTLE_ENDIAN__
  38903 #define vld1_dup_f16(__p0) __extension__ ({ \
  38904   float16x4_t __ret; \
  38905   __ret = (float16x4_t) __builtin_neon_vld1_dup_v(__p0, 8); \
  38906   __ret; \
  38907 })
  38908 #else
  38909 #define vld1_dup_f16(__p0) __extension__ ({ \
  38910   float16x4_t __ret; \
  38911   __ret = (float16x4_t) __builtin_neon_vld1_dup_v(__p0, 8); \
  38912   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  38913   __ret; \
  38914 })
  38915 #endif
  38916 /* vld1q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8_t, passes
         * it (cast to int8x16_t) together with __p0 and __p2 to
         * __builtin_neon_vld1q_lane_v(..., 40), and yields the float16x8_t result.
         * Without __LITTLE_ENDIAN__, the copy is lane-reversed before the call and the
         * result is lane-reversed after it; __p2 is forwarded unchanged in both branches. */
  38917 #ifdef __LITTLE_ENDIAN__
  38918 #define vld1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  38919   float16x8_t __ret; \
  38920   float16x8_t __s1 = __p1; \
  38921   __ret = (float16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 40); \
  38922   __ret; \
  38923 })
  38924 #else
  38925 #define vld1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  38926   float16x8_t __ret; \
  38927   float16x8_t __s1 = __p1; \
  38928   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  38929   __ret = (float16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 40); \
  38930   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  38931   __ret; \
  38932 })
  38933 #endif
  38934 /* vld1_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4_t, passes
         * it (cast to int8x8_t) together with __p0 and __p2 to
         * __builtin_neon_vld1_lane_v(..., 8), and yields the float16x4_t result.
         * Without __LITTLE_ENDIAN__, the copy is lane-reversed before the call and the
         * result is lane-reversed after it; __p2 is forwarded unchanged in both branches. */
  38935 #ifdef __LITTLE_ENDIAN__
  38936 #define vld1_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  38937   float16x4_t __ret; \
  38938   float16x4_t __s1 = __p1; \
  38939   __ret = (float16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 8); \
  38940   __ret; \
  38941 })
  38942 #else
  38943 #define vld1_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  38944   float16x4_t __ret; \
  38945   float16x4_t __s1 = __p1; \
  38946   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  38947   __ret = (float16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 8); \
  38948   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  38949   __ret; \
  38950 })
  38951 #endif
  38952 /* vld1q_f16_x2(__p0): declares a float16x8x2_t, passes its address with __p0 to
         * __builtin_neon_vld1q_x2_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  38953 #ifdef __LITTLE_ENDIAN__
  38954 #define vld1q_f16_x2(__p0) __extension__ ({ \
  38955   float16x8x2_t __ret; \
  38956   __builtin_neon_vld1q_x2_v(&__ret, __p0, 40); \
  38957   __ret; \
  38958 })
  38959 #else
  38960 #define vld1q_f16_x2(__p0) __extension__ ({ \
  38961   float16x8x2_t __ret; \
  38962   __builtin_neon_vld1q_x2_v(&__ret, __p0, 40); \
  38963  \
  38964   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  38965   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  38966   __ret; \
  38967 })
  38968 #endif
  38969 /* vld1_f16_x2(__p0): declares a float16x4x2_t, passes its address with __p0 to
         * __builtin_neon_vld1_x2_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  38970 #ifdef __LITTLE_ENDIAN__
  38971 #define vld1_f16_x2(__p0) __extension__ ({ \
  38972   float16x4x2_t __ret; \
  38973   __builtin_neon_vld1_x2_v(&__ret, __p0, 8); \
  38974   __ret; \
  38975 })
  38976 #else
  38977 #define vld1_f16_x2(__p0) __extension__ ({ \
  38978   float16x4x2_t __ret; \
  38979   __builtin_neon_vld1_x2_v(&__ret, __p0, 8); \
  38980  \
  38981   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  38982   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  38983   __ret; \
  38984 })
  38985 #endif
  38986 /* vld1q_f16_x3(__p0): declares a float16x8x3_t, passes its address with __p0 to
         * __builtin_neon_vld1q_x3_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  38987 #ifdef __LITTLE_ENDIAN__
  38988 #define vld1q_f16_x3(__p0) __extension__ ({ \
  38989   float16x8x3_t __ret; \
  38990   __builtin_neon_vld1q_x3_v(&__ret, __p0, 40); \
  38991   __ret; \
  38992 })
  38993 #else
  38994 #define vld1q_f16_x3(__p0) __extension__ ({ \
  38995   float16x8x3_t __ret; \
  38996   __builtin_neon_vld1q_x3_v(&__ret, __p0, 40); \
  38997  \
  38998   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  38999   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39000   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39001   __ret; \
  39002 })
  39003 #endif
  39004 /* vld1_f16_x3(__p0): declares a float16x4x3_t, passes its address with __p0 to
         * __builtin_neon_vld1_x3_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  39005 #ifdef __LITTLE_ENDIAN__
  39006 #define vld1_f16_x3(__p0) __extension__ ({ \
  39007   float16x4x3_t __ret; \
  39008   __builtin_neon_vld1_x3_v(&__ret, __p0, 8); \
  39009   __ret; \
  39010 })
  39011 #else
  39012 #define vld1_f16_x3(__p0) __extension__ ({ \
  39013   float16x4x3_t __ret; \
  39014   __builtin_neon_vld1_x3_v(&__ret, __p0, 8); \
  39015  \
  39016   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39017   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39018   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39019   __ret; \
  39020 })
  39021 #endif
  39022 /* vld1q_f16_x4(__p0): declares a float16x8x4_t, passes its address with __p0 to
         * __builtin_neon_vld1q_x4_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39023 #ifdef __LITTLE_ENDIAN__
  39024 #define vld1q_f16_x4(__p0) __extension__ ({ \
  39025   float16x8x4_t __ret; \
  39026   __builtin_neon_vld1q_x4_v(&__ret, __p0, 40); \
  39027   __ret; \
  39028 })
  39029 #else
  39030 #define vld1q_f16_x4(__p0) __extension__ ({ \
  39031   float16x8x4_t __ret; \
  39032   __builtin_neon_vld1q_x4_v(&__ret, __p0, 40); \
  39033  \
  39034   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39035   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39036   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39037   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39038   __ret; \
  39039 })
  39040 #endif
  39041 /* vld1_f16_x4(__p0): declares a float16x4x4_t, passes its address with __p0 to
         * __builtin_neon_vld1_x4_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39042 #ifdef __LITTLE_ENDIAN__
  39043 #define vld1_f16_x4(__p0) __extension__ ({ \
  39044   float16x4x4_t __ret; \
  39045   __builtin_neon_vld1_x4_v(&__ret, __p0, 8); \
  39046   __ret; \
  39047 })
  39048 #else
  39049 #define vld1_f16_x4(__p0) __extension__ ({ \
  39050   float16x4x4_t __ret; \
  39051   __builtin_neon_vld1_x4_v(&__ret, __p0, 8); \
  39052  \
  39053   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39054   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39055   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39056   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  39057   __ret; \
  39058 })
  39059 #endif
  39060 /* vld2q_f16(__p0): declares a float16x8x2_t, passes its address with __p0 to
         * __builtin_neon_vld2q_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  39061 #ifdef __LITTLE_ENDIAN__
  39062 #define vld2q_f16(__p0) __extension__ ({ \
  39063   float16x8x2_t __ret; \
  39064   __builtin_neon_vld2q_v(&__ret, __p0, 40); \
  39065   __ret; \
  39066 })
  39067 #else
  39068 #define vld2q_f16(__p0) __extension__ ({ \
  39069   float16x8x2_t __ret; \
  39070   __builtin_neon_vld2q_v(&__ret, __p0, 40); \
  39071  \
  39072   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39073   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39074   __ret; \
  39075 })
  39076 #endif
  39077 /* vld2_f16(__p0): declares a float16x4x2_t, passes its address with __p0 to
         * __builtin_neon_vld2_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  39078 #ifdef __LITTLE_ENDIAN__
  39079 #define vld2_f16(__p0) __extension__ ({ \
  39080   float16x4x2_t __ret; \
  39081   __builtin_neon_vld2_v(&__ret, __p0, 8); \
  39082   __ret; \
  39083 })
  39084 #else
  39085 #define vld2_f16(__p0) __extension__ ({ \
  39086   float16x4x2_t __ret; \
  39087   __builtin_neon_vld2_v(&__ret, __p0, 8); \
  39088  \
  39089   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39090   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39091   __ret; \
  39092 })
  39093 #endif
  39094 /* vld2q_dup_f16(__p0): declares a float16x8x2_t, passes its address with __p0 to
         * __builtin_neon_vld2q_dup_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  39095 #ifdef __LITTLE_ENDIAN__
  39096 #define vld2q_dup_f16(__p0) __extension__ ({ \
  39097   float16x8x2_t __ret; \
  39098   __builtin_neon_vld2q_dup_v(&__ret, __p0, 40); \
  39099   __ret; \
  39100 })
  39101 #else
  39102 #define vld2q_dup_f16(__p0) __extension__ ({ \
  39103   float16x8x2_t __ret; \
  39104   __builtin_neon_vld2q_dup_v(&__ret, __p0, 40); \
  39105  \
  39106   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39107   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39108   __ret; \
  39109 })
  39110 #endif
  39111 /* vld2_dup_f16(__p0): declares a float16x4x2_t, passes its address with __p0 to
         * __builtin_neon_vld2_dup_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] and val[1] are each lane-reversed after the call. */
  39112 #ifdef __LITTLE_ENDIAN__
  39113 #define vld2_dup_f16(__p0) __extension__ ({ \
  39114   float16x4x2_t __ret; \
  39115   __builtin_neon_vld2_dup_v(&__ret, __p0, 8); \
  39116   __ret; \
  39117 })
  39118 #else
  39119 #define vld2_dup_f16(__p0) __extension__ ({ \
  39120   float16x4x2_t __ret; \
  39121   __builtin_neon_vld2_dup_v(&__ret, __p0, 8); \
  39122  \
  39123   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39124   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39125   __ret; \
  39126 })
  39127 #endif
  39128 /* vld2q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8x2_t and
         * calls __builtin_neon_vld2q_lane_v with &__ret, __p0, val[0..1] of the copy
         * (each cast to int8x16_t), __p2 and 40; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39129 #ifdef __LITTLE_ENDIAN__
  39130 #define vld2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39131   float16x8x2_t __ret; \
  39132   float16x8x2_t __s1 = __p1; \
  39133   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 40); \
  39134   __ret; \
  39135 })
  39136 #else
  39137 #define vld2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39138   float16x8x2_t __ret; \
  39139   float16x8x2_t __s1 = __p1; \
  39140   float16x8x2_t __rev1; \
  39141   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39142   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39143   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 40); \
  39144  \
  39145   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39146   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39147   __ret; \
  39148 })
  39149 #endif
  39150 /* vld2_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4x2_t and
         * calls __builtin_neon_vld2_lane_v with &__ret, __p0, val[0..1] of the copy
         * (each cast to int8x8_t), __p2 and 8; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39151 #ifdef __LITTLE_ENDIAN__
  39152 #define vld2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39153   float16x4x2_t __ret; \
  39154   float16x4x2_t __s1 = __p1; \
  39155   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 8); \
  39156   __ret; \
  39157 })
  39158 #else
  39159 #define vld2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39160   float16x4x2_t __ret; \
  39161   float16x4x2_t __s1 = __p1; \
  39162   float16x4x2_t __rev1; \
  39163   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39164   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39165   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 8); \
  39166  \
  39167   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39168   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39169   __ret; \
  39170 })
  39171 #endif
  39172 /* vld3q_f16(__p0): declares a float16x8x3_t, passes its address with __p0 to
         * __builtin_neon_vld3q_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  39173 #ifdef __LITTLE_ENDIAN__
  39174 #define vld3q_f16(__p0) __extension__ ({ \
  39175   float16x8x3_t __ret; \
  39176   __builtin_neon_vld3q_v(&__ret, __p0, 40); \
  39177   __ret; \
  39178 })
  39179 #else
  39180 #define vld3q_f16(__p0) __extension__ ({ \
  39181   float16x8x3_t __ret; \
  39182   __builtin_neon_vld3q_v(&__ret, __p0, 40); \
  39183  \
  39184   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39185   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39186   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39187   __ret; \
  39188 })
  39189 #endif
  39190 /* vld3_f16(__p0): declares a float16x4x3_t, passes its address with __p0 to
         * __builtin_neon_vld3_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  39191 #ifdef __LITTLE_ENDIAN__
  39192 #define vld3_f16(__p0) __extension__ ({ \
  39193   float16x4x3_t __ret; \
  39194   __builtin_neon_vld3_v(&__ret, __p0, 8); \
  39195   __ret; \
  39196 })
  39197 #else
  39198 #define vld3_f16(__p0) __extension__ ({ \
  39199   float16x4x3_t __ret; \
  39200   __builtin_neon_vld3_v(&__ret, __p0, 8); \
  39201  \
  39202   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39203   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39204   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39205   __ret; \
  39206 })
  39207 #endif
  39208 /* vld3q_dup_f16(__p0): declares a float16x8x3_t, passes its address with __p0 to
         * __builtin_neon_vld3q_dup_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  39209 #ifdef __LITTLE_ENDIAN__
  39210 #define vld3q_dup_f16(__p0) __extension__ ({ \
  39211   float16x8x3_t __ret; \
  39212   __builtin_neon_vld3q_dup_v(&__ret, __p0, 40); \
  39213   __ret; \
  39214 })
  39215 #else
  39216 #define vld3q_dup_f16(__p0) __extension__ ({ \
  39217   float16x8x3_t __ret; \
  39218   __builtin_neon_vld3q_dup_v(&__ret, __p0, 40); \
  39219  \
  39220   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39221   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39222   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39223   __ret; \
  39224 })
  39225 #endif
  39226 /* vld3_dup_f16(__p0): declares a float16x4x3_t, passes its address with __p0 to
         * __builtin_neon_vld3_dup_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[2] are each lane-reversed after the call. */
  39227 #ifdef __LITTLE_ENDIAN__
  39228 #define vld3_dup_f16(__p0) __extension__ ({ \
  39229   float16x4x3_t __ret; \
  39230   __builtin_neon_vld3_dup_v(&__ret, __p0, 8); \
  39231   __ret; \
  39232 })
  39233 #else
  39234 #define vld3_dup_f16(__p0) __extension__ ({ \
  39235   float16x4x3_t __ret; \
  39236   __builtin_neon_vld3_dup_v(&__ret, __p0, 8); \
  39237  \
  39238   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39239   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39240   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39241   __ret; \
  39242 })
  39243 #endif
  39244 /* vld3q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8x3_t and
         * calls __builtin_neon_vld3q_lane_v with &__ret, __p0, val[0..2] of the copy
         * (each cast to int8x16_t), __p2 and 40; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39245 #ifdef __LITTLE_ENDIAN__
  39246 #define vld3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39247   float16x8x3_t __ret; \
  39248   float16x8x3_t __s1 = __p1; \
  39249   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 40); \
  39250   __ret; \
  39251 })
  39252 #else
  39253 #define vld3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39254   float16x8x3_t __ret; \
  39255   float16x8x3_t __s1 = __p1; \
  39256   float16x8x3_t __rev1; \
  39257   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39258   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39259   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39260   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 40); \
  39261  \
  39262   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39263   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39264   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39265   __ret; \
  39266 })
  39267 #endif
  39268 /* vld3_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4x3_t and
         * calls __builtin_neon_vld3_lane_v with &__ret, __p0, val[0..2] of the copy
         * (each cast to int8x8_t), __p2 and 8; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39269 #ifdef __LITTLE_ENDIAN__
  39270 #define vld3_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39271   float16x4x3_t __ret; \
  39272   float16x4x3_t __s1 = __p1; \
  39273   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 8); \
  39274   __ret; \
  39275 })
  39276 #else
  39277 #define vld3_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39278   float16x4x3_t __ret; \
  39279   float16x4x3_t __s1 = __p1; \
  39280   float16x4x3_t __rev1; \
  39281   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39282   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39283   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39284   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 8); \
  39285  \
  39286   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39287   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39288   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39289   __ret; \
  39290 })
  39291 #endif
  39292 /* vld4q_f16(__p0): declares a float16x8x4_t, passes its address with __p0 to
         * __builtin_neon_vld4q_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39293 #ifdef __LITTLE_ENDIAN__
  39294 #define vld4q_f16(__p0) __extension__ ({ \
  39295   float16x8x4_t __ret; \
  39296   __builtin_neon_vld4q_v(&__ret, __p0, 40); \
  39297   __ret; \
  39298 })
  39299 #else
  39300 #define vld4q_f16(__p0) __extension__ ({ \
  39301   float16x8x4_t __ret; \
  39302   __builtin_neon_vld4q_v(&__ret, __p0, 40); \
  39303  \
  39304   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39305   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39306   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39307   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39308   __ret; \
  39309 })
  39310 #endif
  39311 /* vld4_f16(__p0): declares a float16x4x4_t, passes its address with __p0 to
         * __builtin_neon_vld4_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39312 #ifdef __LITTLE_ENDIAN__
  39313 #define vld4_f16(__p0) __extension__ ({ \
  39314   float16x4x4_t __ret; \
  39315   __builtin_neon_vld4_v(&__ret, __p0, 8); \
  39316   __ret; \
  39317 })
  39318 #else
  39319 #define vld4_f16(__p0) __extension__ ({ \
  39320   float16x4x4_t __ret; \
  39321   __builtin_neon_vld4_v(&__ret, __p0, 8); \
  39322  \
  39323   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39324   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39325   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39326   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  39327   __ret; \
  39328 })
  39329 #endif
  39330 /* vld4q_dup_f16(__p0): declares a float16x8x4_t, passes its address with __p0 to
         * __builtin_neon_vld4q_dup_v(..., 40) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39331 #ifdef __LITTLE_ENDIAN__
  39332 #define vld4q_dup_f16(__p0) __extension__ ({ \
  39333   float16x8x4_t __ret; \
  39334   __builtin_neon_vld4q_dup_v(&__ret, __p0, 40); \
  39335   __ret; \
  39336 })
  39337 #else
  39338 #define vld4q_dup_f16(__p0) __extension__ ({ \
  39339   float16x8x4_t __ret; \
  39340   __builtin_neon_vld4q_dup_v(&__ret, __p0, 40); \
  39341  \
  39342   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39343   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39344   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39345   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39346   __ret; \
  39347 })
  39348 #endif
  39349 /* vld4_dup_f16(__p0): declares a float16x4x4_t, passes its address with __p0 to
         * __builtin_neon_vld4_dup_v(..., 8) and yields that struct.  Without
         * __LITTLE_ENDIAN__, val[0] through val[3] are each lane-reversed after the call. */
  39350 #ifdef __LITTLE_ENDIAN__
  39351 #define vld4_dup_f16(__p0) __extension__ ({ \
  39352   float16x4x4_t __ret; \
  39353   __builtin_neon_vld4_dup_v(&__ret, __p0, 8); \
  39354   __ret; \
  39355 })
  39356 #else
  39357 #define vld4_dup_f16(__p0) __extension__ ({ \
  39358   float16x4x4_t __ret; \
  39359   __builtin_neon_vld4_dup_v(&__ret, __p0, 8); \
  39360  \
  39361   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39362   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39363   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39364   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  39365   __ret; \
  39366 })
  39367 #endif
  39368 /* vld4q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8x4_t and
         * calls __builtin_neon_vld4q_lane_v with &__ret, __p0, val[0..3] of the copy
         * (each cast to int8x16_t), __p2 and 40; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39369 #ifdef __LITTLE_ENDIAN__
  39370 #define vld4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39371   float16x8x4_t __ret; \
  39372   float16x8x4_t __s1 = __p1; \
  39373   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 40); \
  39374   __ret; \
  39375 })
  39376 #else
  39377 #define vld4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39378   float16x8x4_t __ret; \
  39379   float16x8x4_t __s1 = __p1; \
  39380   float16x8x4_t __rev1; \
  39381   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39382   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39383   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39384   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39385   __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 40); \
  39386  \
  39387   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39388   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39389   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39390   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39391   __ret; \
  39392 })
  39393 #endif
  39394 /* vld4_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4x4_t and
         * calls __builtin_neon_vld4_lane_v with &__ret, __p0, val[0..3] of the copy
         * (each cast to int8x8_t), __p2 and 8; yields __ret.  Without
         * __LITTLE_ENDIAN__, the inputs are lane-reversed into __rev1 before the call and
         * each __ret.val[i] is lane-reversed after it; __p2 is forwarded unchanged. */
  39395 #ifdef __LITTLE_ENDIAN__
  39396 #define vld4_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39397   float16x4x4_t __ret; \
  39398   float16x4x4_t __s1 = __p1; \
  39399   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 8); \
  39400   __ret; \
  39401 })
  39402 #else
  39403 #define vld4_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39404   float16x4x4_t __ret; \
  39405   float16x4x4_t __s1 = __p1; \
  39406   float16x4x4_t __rev1; \
  39407   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39408   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39409   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39410   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  39411   __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 8); \
  39412  \
  39413   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  39414   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  39415   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  39416   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  39417   __ret; \
  39418 })
  39419 #endif
  39420 /* vst1q_f16(__p0, __p1): copies __p1 into a local float16x8_t and passes it (cast
         * to int8x16_t) with __p0 to __builtin_neon_vst1q_v(..., 40).  Without
         * __LITTLE_ENDIAN__, the copy's eight lanes are reversed before the call.
         * NOTE(review): 40 is presumably the builtin's float16x8 type code -- confirm. */
  39421 #ifdef __LITTLE_ENDIAN__
  39422 #define vst1q_f16(__p0, __p1) __extension__ ({ \
  39423   float16x8_t __s1 = __p1; \
  39424   __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 40); \
  39425 })
  39426 #else
  39427 #define vst1q_f16(__p0, __p1) __extension__ ({ \
  39428   float16x8_t __s1 = __p1; \
  39429   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  39430   __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 40); \
  39431 })
  39432 #endif
  39433 /* vst1_f16(__p0, __p1): copies __p1 into a local float16x4_t and passes it (cast
         * to int8x8_t) with __p0 to __builtin_neon_vst1_v(..., 8).  Without
         * __LITTLE_ENDIAN__, the copy's four lanes are reversed before the call.
         * NOTE(review): 8 is presumably the builtin's float16x4 type code -- confirm. */
  39434 #ifdef __LITTLE_ENDIAN__
  39435 #define vst1_f16(__p0, __p1) __extension__ ({ \
  39436   float16x4_t __s1 = __p1; \
  39437   __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 8); \
  39438 })
  39439 #else
  39440 #define vst1_f16(__p0, __p1) __extension__ ({ \
  39441   float16x4_t __s1 = __p1; \
  39442   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  39443   __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 8); \
  39444 })
  39445 #endif
  39446 /* vst1q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8_t and
         * passes it (cast to int8x16_t) with __p0 and __p2 to
         * __builtin_neon_vst1q_lane_v(..., 40).  Without __LITTLE_ENDIAN__, the copy is
         * lane-reversed before the call; __p2 is forwarded unchanged in both branches. */
  39447 #ifdef __LITTLE_ENDIAN__
  39448 #define vst1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39449   float16x8_t __s1 = __p1; \
  39450   __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 40); \
  39451 })
  39452 #else
  39453 #define vst1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39454   float16x8_t __s1 = __p1; \
  39455   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  39456   __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 40); \
  39457 })
  39458 #endif
  39459 /* vst1_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4_t and
         * passes it (cast to int8x8_t) with __p0 and __p2 to
         * __builtin_neon_vst1_lane_v(..., 8).  Without __LITTLE_ENDIAN__, the copy is
         * lane-reversed before the call; __p2 is forwarded unchanged in both branches. */
  39460 #ifdef __LITTLE_ENDIAN__
  39461 #define vst1_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39462   float16x4_t __s1 = __p1; \
  39463   __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 8); \
  39464 })
  39465 #else
  39466 #define vst1_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39467   float16x4_t __s1 = __p1; \
  39468   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  39469   __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 8); \
  39470 })
  39471 #endif
  39472 /* vst1q_f16_x2(__p0, __p1): copies __p1 into a local float16x8x2_t and passes
         * val[0..1] (each cast to int8x16_t) with __p0 to __builtin_neon_vst1q_x2_v(..., 40).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39473 #ifdef __LITTLE_ENDIAN__
  39474 #define vst1q_f16_x2(__p0, __p1) __extension__ ({ \
  39475   float16x8x2_t __s1 = __p1; \
  39476   __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 40); \
  39477 })
  39478 #else
  39479 #define vst1q_f16_x2(__p0, __p1) __extension__ ({ \
  39480   float16x8x2_t __s1 = __p1; \
  39481   float16x8x2_t __rev1; \
  39482   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39483   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39484   __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 40); \
  39485 })
  39486 #endif
  39487 /* vst1_f16_x2(__p0, __p1): copies __p1 into a local float16x4x2_t and passes
         * val[0..1] (each cast to int8x8_t) with __p0 to __builtin_neon_vst1_x2_v(..., 8).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39488 #ifdef __LITTLE_ENDIAN__
  39489 #define vst1_f16_x2(__p0, __p1) __extension__ ({ \
  39490   float16x4x2_t __s1 = __p1; \
  39491   __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 8); \
  39492 })
  39493 #else
  39494 #define vst1_f16_x2(__p0, __p1) __extension__ ({ \
  39495   float16x4x2_t __s1 = __p1; \
  39496   float16x4x2_t __rev1; \
  39497   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39498   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39499   __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 8); \
  39500 })
  39501 #endif
  39502 /* vst1q_f16_x3(__p0, __p1): copies __p1 into a local float16x8x3_t and passes
         * val[0..2] (each cast to int8x16_t) with __p0 to __builtin_neon_vst1q_x3_v(..., 40).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39503 #ifdef __LITTLE_ENDIAN__
  39504 #define vst1q_f16_x3(__p0, __p1) __extension__ ({ \
  39505   float16x8x3_t __s1 = __p1; \
  39506   __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 40); \
  39507 })
  39508 #else
  39509 #define vst1q_f16_x3(__p0, __p1) __extension__ ({ \
  39510   float16x8x3_t __s1 = __p1; \
  39511   float16x8x3_t __rev1; \
  39512   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39513   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39514   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39515   __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 40); \
  39516 })
  39517 #endif
  39518 /* vst1_f16_x3(__p0, __p1): copies __p1 into a local float16x4x3_t and passes
         * val[0..2] (each cast to int8x8_t) with __p0 to __builtin_neon_vst1_x3_v(..., 8).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39519 #ifdef __LITTLE_ENDIAN__
  39520 #define vst1_f16_x3(__p0, __p1) __extension__ ({ \
  39521   float16x4x3_t __s1 = __p1; \
  39522   __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 8); \
  39523 })
  39524 #else
  39525 #define vst1_f16_x3(__p0, __p1) __extension__ ({ \
  39526   float16x4x3_t __s1 = __p1; \
  39527   float16x4x3_t __rev1; \
  39528   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39529   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39530   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39531   __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 8); \
  39532 })
  39533 #endif
  39534 /* vst1q_f16_x4(__p0, __p1): copies __p1 into a local float16x8x4_t and passes
         * val[0..3] (each cast to int8x16_t) with __p0 to __builtin_neon_vst1q_x4_v(..., 40).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39535 #ifdef __LITTLE_ENDIAN__
  39536 #define vst1q_f16_x4(__p0, __p1) __extension__ ({ \
  39537   float16x8x4_t __s1 = __p1; \
  39538   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 40); \
  39539 })
  39540 #else
  39541 #define vst1q_f16_x4(__p0, __p1) __extension__ ({ \
  39542   float16x8x4_t __s1 = __p1; \
  39543   float16x8x4_t __rev1; \
  39544   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39545   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39546   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39547   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39548   __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 40); \
  39549 })
  39550 #endif
  39551 /* vst1_f16_x4(__p0, __p1): copies __p1 into a local float16x4x4_t and passes
         * val[0..3] (each cast to int8x8_t) with __p0 to __builtin_neon_vst1_x4_v(..., 8).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39552 #ifdef __LITTLE_ENDIAN__
  39553 #define vst1_f16_x4(__p0, __p1) __extension__ ({ \
  39554   float16x4x4_t __s1 = __p1; \
  39555   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 8); \
  39556 })
  39557 #else
  39558 #define vst1_f16_x4(__p0, __p1) __extension__ ({ \
  39559   float16x4x4_t __s1 = __p1; \
  39560   float16x4x4_t __rev1; \
  39561   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39562   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39563   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39564   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  39565   __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 8); \
  39566 })
  39567 #endif
  39568 /* vst2q_f16(__p0, __p1): copies __p1 into a local float16x8x2_t and passes
         * val[0..1] (each cast to int8x16_t) with __p0 to __builtin_neon_vst2q_v(..., 40).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39569 #ifdef __LITTLE_ENDIAN__
  39570 #define vst2q_f16(__p0, __p1) __extension__ ({ \
  39571   float16x8x2_t __s1 = __p1; \
  39572   __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 40); \
  39573 })
  39574 #else
  39575 #define vst2q_f16(__p0, __p1) __extension__ ({ \
  39576   float16x8x2_t __s1 = __p1; \
  39577   float16x8x2_t __rev1; \
  39578   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39579   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39580   __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 40); \
  39581 })
  39582 #endif
  39583 /* vst2_f16(__p0, __p1): copies __p1 into a local float16x4x2_t and passes
         * val[0..1] (each cast to int8x8_t) with __p0 to __builtin_neon_vst2_v(..., 8).
         * Without __LITTLE_ENDIAN__, each val[i] is lane-reversed into __rev1 first. */
  39584 #ifdef __LITTLE_ENDIAN__
  39585 #define vst2_f16(__p0, __p1) __extension__ ({ \
  39586   float16x4x2_t __s1 = __p1; \
  39587   __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 8); \
  39588 })
  39589 #else
  39590 #define vst2_f16(__p0, __p1) __extension__ ({ \
  39591   float16x4x2_t __s1 = __p1; \
  39592   float16x4x2_t __rev1; \
  39593   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39594   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39595   __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 8); \
  39596 })
  39597 #endif
  39598 /* vst2q_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x8x2_t and
         * passes val[0..1] (each cast to int8x16_t) with __p0 and __p2 to
         * __builtin_neon_vst2q_lane_v(..., 40).  Without __LITTLE_ENDIAN__, each val[i]
         * is lane-reversed into __rev1 first; __p2 is forwarded unchanged. */
  39599 #ifdef __LITTLE_ENDIAN__
  39600 #define vst2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39601   float16x8x2_t __s1 = __p1; \
  39602   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 40); \
  39603 })
  39604 #else
  39605 #define vst2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39606   float16x8x2_t __s1 = __p1; \
  39607   float16x8x2_t __rev1; \
  39608   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39609   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39610   __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 40); \
  39611 })
  39612 #endif
  39613 /* vst2_lane_f16(__p0, __p1, __p2): copies __p1 into a local float16x4x2_t and
         * passes val[0..1] (each cast to int8x8_t) with __p0 and __p2 to
         * __builtin_neon_vst2_lane_v(..., 8).  Without __LITTLE_ENDIAN__, each val[i]
         * is lane-reversed into __rev1 first; __p2 is forwarded unchanged. */
  39614 #ifdef __LITTLE_ENDIAN__
  39615 #define vst2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39616   float16x4x2_t __s1 = __p1; \
  39617   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 8); \
  39618 })
  39619 #else
  39620 #define vst2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39621   float16x4x2_t __s1 = __p1; \
  39622   float16x4x2_t __rev1; \
  39623   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39624   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39625   __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 8); \
  39626 })
  39627 #endif
  39628 
  39629 #ifdef __LITTLE_ENDIAN__
        /* vst3q_f16(__p0, __p1): copies __p1 into a float16x8x3_t local, then passes
         * __p0 and the three member vectors (cast to int8x16_t) to
         * __builtin_neon_vst3q_v together with the constant 40 (apparently the
         * float16x8 type selector -- TODO confirm). */
  39630 #define vst3q_f16(__p0, __p1) __extension__ ({ \
  39631   float16x8x3_t __s1 = __p1; \
  39632   __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 40); \
  39633 })
  39634 #else
        /* Big-endian build: all three member vectors have their 8 lanes reversed into
         * __rev1 before the same builtin call. */
  39635 #define vst3q_f16(__p0, __p1) __extension__ ({ \
  39636   float16x8x3_t __s1 = __p1; \
  39637   float16x8x3_t __rev1; \
  39638   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39639   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39640   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39641   __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 40); \
  39642 })
  39643 #endif
  39644 
  39645 #ifdef __LITTLE_ENDIAN__
        /* vst3_f16(__p0, __p1): copies __p1 into a float16x4x3_t local, then passes
         * __p0 and the three member vectors (cast to int8x8_t) to
         * __builtin_neon_vst3_v together with the constant 8 (apparently the
         * float16x4 type selector -- TODO confirm). */
  39646 #define vst3_f16(__p0, __p1) __extension__ ({ \
  39647   float16x4x3_t __s1 = __p1; \
  39648   __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 8); \
  39649 })
  39650 #else
        /* Big-endian build: all three member vectors have their 4 lanes reversed into
         * __rev1 before the same builtin call. */
  39651 #define vst3_f16(__p0, __p1) __extension__ ({ \
  39652   float16x4x3_t __s1 = __p1; \
  39653   float16x4x3_t __rev1; \
  39654   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39655   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39656   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39657   __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 8); \
  39658 })
  39659 #endif
  39660 
  39661 #ifdef __LITTLE_ENDIAN__
        /* vst3q_lane_f16(__p0, __p1, __p2): copies __p1 into a float16x8x3_t local and
         * passes __p0, the three member vectors (cast to int8x16_t), __p2 and the
         * constant 40 to __builtin_neon_vst3q_lane_v.
         * NOTE(review): __p2 is presumably the lane index -- confirm against ACLE. */
  39662 #define vst3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39663   float16x8x3_t __s1 = __p1; \
  39664   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 40); \
  39665 })
  39666 #else
        /* Big-endian build: all three member vectors have their 8 lanes reversed into
         * __rev1 before the call; __p2 is forwarded unchanged. */
  39667 #define vst3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39668   float16x8x3_t __s1 = __p1; \
  39669   float16x8x3_t __rev1; \
  39670   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39671   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39672   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39673   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 40); \
  39674 })
  39675 #endif
  39676 
  39677 #ifdef __LITTLE_ENDIAN__
        /* vst3_lane_f16(__p0, __p1, __p2): copies __p1 into a float16x4x3_t local and
         * passes __p0, the three member vectors (cast to int8x8_t), __p2 and the
         * constant 8 to __builtin_neon_vst3_lane_v.
         * NOTE(review): __p2 is presumably the lane index -- confirm against ACLE. */
  39678 #define vst3_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39679   float16x4x3_t __s1 = __p1; \
  39680   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 8); \
  39681 })
  39682 #else
        /* Big-endian build: all three member vectors have their 4 lanes reversed into
         * __rev1 before the call; __p2 is forwarded unchanged. */
  39683 #define vst3_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39684   float16x4x3_t __s1 = __p1; \
  39685   float16x4x3_t __rev1; \
  39686   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39687   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39688   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39689   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 8); \
  39690 })
  39691 #endif
  39692 
  39693 #ifdef __LITTLE_ENDIAN__
        /* vst4q_f16(__p0, __p1): copies __p1 into a float16x8x4_t local, then passes
         * __p0 and the four member vectors (cast to int8x16_t) to
         * __builtin_neon_vst4q_v together with the constant 40 (apparently the
         * float16x8 type selector -- TODO confirm). */
  39694 #define vst4q_f16(__p0, __p1) __extension__ ({ \
  39695   float16x8x4_t __s1 = __p1; \
  39696   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 40); \
  39697 })
  39698 #else
        /* Big-endian build: all four member vectors have their 8 lanes reversed into
         * __rev1 before the same builtin call. */
  39699 #define vst4q_f16(__p0, __p1) __extension__ ({ \
  39700   float16x8x4_t __s1 = __p1; \
  39701   float16x8x4_t __rev1; \
  39702   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39703   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39704   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39705   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39706   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 40); \
  39707 })
  39708 #endif
  39709 
  39710 #ifdef __LITTLE_ENDIAN__
        /* vst4_f16(__p0, __p1): copies __p1 into a float16x4x4_t local, then passes
         * __p0 and the four member vectors (cast to int8x8_t) to
         * __builtin_neon_vst4_v together with the constant 8 (apparently the
         * float16x4 type selector -- TODO confirm). */
  39711 #define vst4_f16(__p0, __p1) __extension__ ({ \
  39712   float16x4x4_t __s1 = __p1; \
  39713   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 8); \
  39714 })
  39715 #else
        /* Big-endian build: all four member vectors have their 4 lanes reversed into
         * __rev1 before the same builtin call. */
  39716 #define vst4_f16(__p0, __p1) __extension__ ({ \
  39717   float16x4x4_t __s1 = __p1; \
  39718   float16x4x4_t __rev1; \
  39719   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39720   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39721   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39722   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  39723   __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 8); \
  39724 })
  39725 #endif
  39726 
  39727 #ifdef __LITTLE_ENDIAN__
        /* vst4q_lane_f16(__p0, __p1, __p2): copies __p1 into a float16x8x4_t local and
         * passes __p0, the four member vectors (cast to int8x16_t), __p2 and the
         * constant 40 to __builtin_neon_vst4q_lane_v.
         * NOTE(review): __p2 is presumably the lane index -- confirm against ACLE. */
  39728 #define vst4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39729   float16x8x4_t __s1 = __p1; \
  39730   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 40); \
  39731 })
  39732 #else
        /* Big-endian build: all four member vectors have their 8 lanes reversed into
         * __rev1 before the call; __p2 is forwarded unchanged. */
  39733 #define vst4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39734   float16x8x4_t __s1 = __p1; \
  39735   float16x8x4_t __rev1; \
  39736   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  39737   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  39738   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  39739   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  39740   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 40); \
  39741 })
  39742 #endif
  39743 
  39744 #ifdef __LITTLE_ENDIAN__
        /* vst4_lane_f16(__p0, __p1, __p2): copies __p1 into a float16x4x4_t local and
         * passes __p0, the four member vectors (cast to int8x8_t), __p2 and the
         * constant 8 to __builtin_neon_vst4_lane_v.
         * NOTE(review): __p2 is presumably the lane index -- confirm against ACLE. */
  39745 #define vst4_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39746   float16x4x4_t __s1 = __p1; \
  39747   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 8); \
  39748 })
  39749 #else
        /* Big-endian build: all four member vectors have their 4 lanes reversed into
         * __rev1 before the call; __p2 is forwarded unchanged. */
  39750 #define vst4_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  39751   float16x4x4_t __s1 = __p1; \
  39752   float16x4x4_t __rev1; \
  39753   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  39754   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  39755   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  39756   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  39757   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 8); \
  39758 })
  39759 #endif
  39760 
  39761 #endif
  39762 #if (defined(__aarch64__)  || defined(__arm64ec__)) && defined(__ARM_FEATURE_NUMERIC_MAXMIN)
  39763 #ifdef __LITTLE_ENDIAN__
        /* vmaxnmq_f64: forwards both float64x2_t operands (cast to int8x16_t) to
         * __builtin_neon_vmaxnmq_v with the constant 42 and casts the result back to
         * float64x2_t.
         * NOTE(review): per ACLE naming this is presumably the lane-wise IEEE maxNum
         * operation -- confirm against the intrinsics reference. */
  39764 __ai __attribute__((target("neon"))) float64x2_t vmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  39765   float64x2_t __ret;
  39766   __ret = (float64x2_t) __builtin_neon_vmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  39767   return __ret;
  39768 }
  39769 #else
        /* Big-endian build: the two lanes of each operand are swapped before the
         * builtin call and the two lanes of the result are swapped again afterwards. */
  39770 __ai __attribute__((target("neon"))) float64x2_t vmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  39771   float64x2_t __ret;
  39772   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39773   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  39774   __ret = (float64x2_t) __builtin_neon_vmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  39775   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39776   return __ret;
  39777 }
  39778 #endif
  39779 
  39780 __ai __attribute__((target("neon"))) float64x1_t vmaxnm_f64(float64x1_t __p0, float64x1_t __p1) {
          /* Single-lane variant: no endian-specific copy exists, so the operands go
           * straight to __builtin_neon_vmaxnm_v (cast to int8x8_t, constant 10) and
           * the result is cast back to float64x1_t. */
  39781   float64x1_t __ret;
  39782   __ret = (float64x1_t) __builtin_neon_vmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  39783   return __ret;
  39784 }
  39785 #ifdef __LITTLE_ENDIAN__
        /* vminnmq_f64: forwards both float64x2_t operands (cast to int8x16_t) to
         * __builtin_neon_vminnmq_v with the constant 42 and casts the result back to
         * float64x2_t.
         * NOTE(review): per ACLE naming this is presumably the lane-wise IEEE minNum
         * operation -- confirm against the intrinsics reference. */
  39786 __ai __attribute__((target("neon"))) float64x2_t vminnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  39787   float64x2_t __ret;
  39788   __ret = (float64x2_t) __builtin_neon_vminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  39789   return __ret;
  39790 }
  39791 #else
        /* Big-endian build: the two lanes of each operand are swapped before the
         * builtin call and the two lanes of the result are swapped again afterwards. */
  39792 __ai __attribute__((target("neon"))) float64x2_t vminnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  39793   float64x2_t __ret;
  39794   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39795   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  39796   __ret = (float64x2_t) __builtin_neon_vminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  39797   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39798   return __ret;
  39799 }
  39800 #endif
  39801 
  39802 __ai __attribute__((target("neon"))) float64x1_t vminnm_f64(float64x1_t __p0, float64x1_t __p1) {
          /* Single-lane variant: no endian-specific copy exists, so the operands go
           * straight to __builtin_neon_vminnm_v (cast to int8x8_t, constant 10) and
           * the result is cast back to float64x1_t. */
  39803   float64x1_t __ret;
  39804   __ret = (float64x1_t) __builtin_neon_vminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  39805   return __ret;
  39806 }
  39807 #endif
  39808 #if (defined(__aarch64__) || defined(__arm64ec__)) && defined(__ARM_FEATURE_DIRECTED_ROUNDING)
  39809 #ifdef __LITTLE_ENDIAN__
        /* vrndq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests round-toward-zero to integral --
         * confirm against the intrinsics reference. */
  39810 __ai __attribute__((target("neon"))) float64x2_t vrndq_f64(float64x2_t __p0) {
  39811   float64x2_t __ret;
  39812   __ret = (float64x2_t) __builtin_neon_vrndq_v((int8x16_t)__p0, 42);
  39813   return __ret;
  39814 }
  39815 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39816 __ai __attribute__((target("neon"))) float64x2_t vrndq_f64(float64x2_t __p0) {
  39817   float64x2_t __ret;
  39818   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39819   __ret = (float64x2_t) __builtin_neon_vrndq_v((int8x16_t)__rev0, 42);
  39820   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39821   return __ret;
  39822 }
  39823 #endif
  39824 
  39825 __ai __attribute__((target("neon"))) float64x1_t vrnd_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrnd_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39826   float64x1_t __ret;
  39827   __ret = (float64x1_t) __builtin_neon_vrnd_v((int8x8_t)__p0, 10);
  39828   return __ret;
  39829 }
  39830 #ifdef __LITTLE_ENDIAN__
        /* vrndaq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndaq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests round-to-nearest, ties away from zero --
         * confirm against the intrinsics reference. */
  39831 __ai __attribute__((target("neon"))) float64x2_t vrndaq_f64(float64x2_t __p0) {
  39832   float64x2_t __ret;
  39833   __ret = (float64x2_t) __builtin_neon_vrndaq_v((int8x16_t)__p0, 42);
  39834   return __ret;
  39835 }
  39836 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39837 __ai __attribute__((target("neon"))) float64x2_t vrndaq_f64(float64x2_t __p0) {
  39838   float64x2_t __ret;
  39839   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39840   __ret = (float64x2_t) __builtin_neon_vrndaq_v((int8x16_t)__rev0, 42);
  39841   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39842   return __ret;
  39843 }
  39844 #endif
  39845 
  39846 __ai __attribute__((target("neon"))) float64x1_t vrnda_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrnda_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39847   float64x1_t __ret;
  39848   __ret = (float64x1_t) __builtin_neon_vrnda_v((int8x8_t)__p0, 10);
  39849   return __ret;
  39850 }
  39851 #ifdef __LITTLE_ENDIAN__
        /* vrndiq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndiq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests rounding in the current rounding mode --
         * confirm against the intrinsics reference. */
  39852 __ai __attribute__((target("neon"))) float64x2_t vrndiq_f64(float64x2_t __p0) {
  39853   float64x2_t __ret;
  39854   __ret = (float64x2_t) __builtin_neon_vrndiq_v((int8x16_t)__p0, 42);
  39855   return __ret;
  39856 }
  39857 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39858 __ai __attribute__((target("neon"))) float64x2_t vrndiq_f64(float64x2_t __p0) {
  39859   float64x2_t __ret;
  39860   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39861   __ret = (float64x2_t) __builtin_neon_vrndiq_v((int8x16_t)__rev0, 42);
  39862   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39863   return __ret;
  39864 }
  39865 #endif
  39866 
  39867 __ai __attribute__((target("neon"))) float64x1_t vrndi_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrndi_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39868   float64x1_t __ret;
  39869   __ret = (float64x1_t) __builtin_neon_vrndi_v((int8x8_t)__p0, 10);
  39870   return __ret;
  39871 }
  39872 #ifdef __LITTLE_ENDIAN__
        /* vrndmq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndmq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests rounding toward minus infinity --
         * confirm against the intrinsics reference. */
  39873 __ai __attribute__((target("neon"))) float64x2_t vrndmq_f64(float64x2_t __p0) {
  39874   float64x2_t __ret;
  39875   __ret = (float64x2_t) __builtin_neon_vrndmq_v((int8x16_t)__p0, 42);
  39876   return __ret;
  39877 }
  39878 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39879 __ai __attribute__((target("neon"))) float64x2_t vrndmq_f64(float64x2_t __p0) {
  39880   float64x2_t __ret;
  39881   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39882   __ret = (float64x2_t) __builtin_neon_vrndmq_v((int8x16_t)__rev0, 42);
  39883   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39884   return __ret;
  39885 }
  39886 #endif
  39887 
  39888 __ai __attribute__((target("neon"))) float64x1_t vrndm_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrndm_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39889   float64x1_t __ret;
  39890   __ret = (float64x1_t) __builtin_neon_vrndm_v((int8x8_t)__p0, 10);
  39891   return __ret;
  39892 }
  39893 #ifdef __LITTLE_ENDIAN__
        /* vrndnq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndnq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests round-to-nearest, ties to even --
         * confirm against the intrinsics reference. */
  39894 __ai __attribute__((target("neon"))) float64x2_t vrndnq_f64(float64x2_t __p0) {
  39895   float64x2_t __ret;
  39896   __ret = (float64x2_t) __builtin_neon_vrndnq_v((int8x16_t)__p0, 42);
  39897   return __ret;
  39898 }
  39899 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39900 __ai __attribute__((target("neon"))) float64x2_t vrndnq_f64(float64x2_t __p0) {
  39901   float64x2_t __ret;
  39902   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39903   __ret = (float64x2_t) __builtin_neon_vrndnq_v((int8x16_t)__rev0, 42);
  39904   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39905   return __ret;
  39906 }
  39907 #endif
  39908 
  39909 __ai __attribute__((target("neon"))) float64x1_t vrndn_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrndn_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39910   float64x1_t __ret;
  39911   __ret = (float64x1_t) __builtin_neon_vrndn_v((int8x8_t)__p0, 10);
  39912   return __ret;
  39913 }
  39914 #ifdef __LITTLE_ENDIAN__
        /* vrndpq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndpq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests rounding toward plus infinity --
         * confirm against the intrinsics reference. */
  39915 __ai __attribute__((target("neon"))) float64x2_t vrndpq_f64(float64x2_t __p0) {
  39916   float64x2_t __ret;
  39917   __ret = (float64x2_t) __builtin_neon_vrndpq_v((int8x16_t)__p0, 42);
  39918   return __ret;
  39919 }
  39920 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39921 __ai __attribute__((target("neon"))) float64x2_t vrndpq_f64(float64x2_t __p0) {
  39922   float64x2_t __ret;
  39923   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39924   __ret = (float64x2_t) __builtin_neon_vrndpq_v((int8x16_t)__rev0, 42);
  39925   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39926   return __ret;
  39927 }
  39928 #endif
  39929 
  39930 __ai __attribute__((target("neon"))) float64x1_t vrndp_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrndp_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39931   float64x1_t __ret;
  39932   __ret = (float64x1_t) __builtin_neon_vrndp_v((int8x8_t)__p0, 10);
  39933   return __ret;
  39934 }
  39935 #ifdef __LITTLE_ENDIAN__
        /* vrndxq_f64: passes the float64x2_t operand (cast to int8x16_t) to
         * __builtin_neon_vrndxq_v with the constant 42 and casts the result back.
         * NOTE(review): ACLE naming suggests current-mode rounding that signals
         * inexact -- confirm against the intrinsics reference. */
  39936 __ai __attribute__((target("neon"))) float64x2_t vrndxq_f64(float64x2_t __p0) {
  39937   float64x2_t __ret;
  39938   __ret = (float64x2_t) __builtin_neon_vrndxq_v((int8x16_t)__p0, 42);
  39939   return __ret;
  39940 }
  39941 #else
        /* Big-endian build: the operand's two lanes are swapped before the builtin
         * call and the result's lanes are swapped again afterwards. */
  39942 __ai __attribute__((target("neon"))) float64x2_t vrndxq_f64(float64x2_t __p0) {
  39943   float64x2_t __ret;
  39944   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  39945   __ret = (float64x2_t) __builtin_neon_vrndxq_v((int8x16_t)__rev0, 42);
  39946   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  39947   return __ret;
  39948 }
  39949 #endif
  39950 
  39951 __ai __attribute__((target("neon"))) float64x1_t vrndx_f64(float64x1_t __p0) {
          /* Single-lane variant with no endian-specific copy: the operand is cast to
           * int8x8_t, handed to __builtin_neon_vrndx_v with the constant 10, and the
           * result is cast back to float64x1_t. */
  39952   float64x1_t __ret;
  39953   __ret = (float64x1_t) __builtin_neon_vrndx_v((int8x8_t)__p0, 10);
  39954   return __ret;
  39955 }
  39956 #endif
  39957 #if __ARM_ARCH >= 8
  39958 #ifdef __LITTLE_ENDIAN__
        /* vaesdq_u8: compiled with target("aes,neon"). Both uint8x16_t operands are
         * cast to int8x16_t and passed to __builtin_neon_vaesdq_u8 with the constant
         * 48; the result is cast back to uint8x16_t.
         * NOTE(review): presumably one AES decryption round step (AESD) -- confirm
         * against the ACLE crypto intrinsics reference. */
  39959 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesdq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  39960   uint8x16_t __ret;
  39961   __ret = (uint8x16_t) __builtin_neon_vaesdq_u8((int8x16_t)__p0, (int8x16_t)__p1, 48);
  39962   return __ret;
  39963 }
  39964 #else
        /* Big-endian build: all 16 byte lanes of each operand are reversed before the
         * builtin call, and the 16 lanes of the result are reversed again afterwards. */
  39965 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesdq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  39966   uint8x16_t __ret;
  39967   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39968   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39969   __ret = (uint8x16_t) __builtin_neon_vaesdq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  39970   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39971   return __ret;
  39972 }
  39973 #endif
  39974 
  39975 #ifdef __LITTLE_ENDIAN__
        /* vaeseq_u8: compiled with target("aes,neon"). Both uint8x16_t operands are
         * cast to int8x16_t and passed to __builtin_neon_vaeseq_u8 with the constant
         * 48; the result is cast back to uint8x16_t.
         * NOTE(review): presumably one AES encryption round step (AESE) -- confirm
         * against the ACLE crypto intrinsics reference. */
  39976 __ai __attribute__((target("aes,neon"))) uint8x16_t vaeseq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  39977   uint8x16_t __ret;
  39978   __ret = (uint8x16_t) __builtin_neon_vaeseq_u8((int8x16_t)__p0, (int8x16_t)__p1, 48);
  39979   return __ret;
  39980 }
  39981 #else
        /* Big-endian build: all 16 byte lanes of each operand are reversed before the
         * builtin call, and the 16 lanes of the result are reversed again afterwards. */
  39982 __ai __attribute__((target("aes,neon"))) uint8x16_t vaeseq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  39983   uint8x16_t __ret;
  39984   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39985   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39986   __ret = (uint8x16_t) __builtin_neon_vaeseq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  39987   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  39988   return __ret;
  39989 }
  39990 #endif
  39991 
  39992 #ifdef __LITTLE_ENDIAN__
        /* vaesimcq_u8: compiled with target("aes,neon"). The uint8x16_t operand is
         * cast to int8x16_t and passed to __builtin_neon_vaesimcq_u8 with the constant
         * 48; the result is cast back to uint8x16_t.
         * NOTE(review): presumably AES inverse MixColumns (AESIMC) -- confirm against
         * the ACLE crypto intrinsics reference. */
  39993 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesimcq_u8(uint8x16_t __p0) {
  39994   uint8x16_t __ret;
  39995   __ret = (uint8x16_t) __builtin_neon_vaesimcq_u8((int8x16_t)__p0, 48);
  39996   return __ret;
  39997 }
  39998 #else
        /* Big-endian build: the operand's 16 byte lanes are reversed before the
         * builtin call, and the result's lanes are reversed again afterwards. */
  39999 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesimcq_u8(uint8x16_t __p0) {
  40000   uint8x16_t __ret;
  40001   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  40002   __ret = (uint8x16_t) __builtin_neon_vaesimcq_u8((int8x16_t)__rev0, 48);
  40003   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  40004   return __ret;
  40005 }
  40006 #endif
  40007 
  40008 #ifdef __LITTLE_ENDIAN__
        /* vaesmcq_u8: compiled with target("aes,neon"). The uint8x16_t operand is
         * cast to int8x16_t and passed to __builtin_neon_vaesmcq_u8 with the constant
         * 48; the result is cast back to uint8x16_t.
         * NOTE(review): presumably AES MixColumns (AESMC) -- confirm against the ACLE
         * crypto intrinsics reference. */
  40009 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesmcq_u8(uint8x16_t __p0) {
  40010   uint8x16_t __ret;
  40011   __ret = (uint8x16_t) __builtin_neon_vaesmcq_u8((int8x16_t)__p0, 48);
  40012   return __ret;
  40013 }
  40014 #else
        /* Big-endian build: the operand's 16 byte lanes are reversed before the
         * builtin call, and the result's lanes are reversed again afterwards. */
  40015 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesmcq_u8(uint8x16_t __p0) {
  40016   uint8x16_t __ret;
  40017   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  40018   __ret = (uint8x16_t) __builtin_neon_vaesmcq_u8((int8x16_t)__rev0, 48);
  40019   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  40020   return __ret;
  40021 }
  40022 #endif
  40023 
  40024 #ifdef __LITTLE_ENDIAN__
        /* vcvtaq_s32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtaq_s32_v with the constant 34 and casts the result to
         * int32x4_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding to
         * nearest with ties away from zero -- confirm. */
  40025 __ai __attribute__((target("neon"))) int32x4_t vcvtaq_s32_f32(float32x4_t __p0) {
  40026   int32x4_t __ret;
  40027   __ret = (int32x4_t) __builtin_neon_vcvtaq_s32_v((int8x16_t)__p0, 34);
  40028   return __ret;
  40029 }
  40030 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40031 __ai __attribute__((target("neon"))) int32x4_t vcvtaq_s32_f32(float32x4_t __p0) {
  40032   int32x4_t __ret;
  40033   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40034   __ret = (int32x4_t) __builtin_neon_vcvtaq_s32_v((int8x16_t)__rev0, 34);
  40035   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40036   return __ret;
  40037 }
  40038 #endif
  40039 
  40040 #ifdef __LITTLE_ENDIAN__
        /* vcvta_s32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvta_s32_v with the constant 2 and casts the result to
         * int32x2_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding to
         * nearest with ties away from zero -- confirm. */
  40041 __ai __attribute__((target("neon"))) int32x2_t vcvta_s32_f32(float32x2_t __p0) {
  40042   int32x2_t __ret;
  40043   __ret = (int32x2_t) __builtin_neon_vcvta_s32_v((int8x8_t)__p0, 2);
  40044   return __ret;
  40045 }
  40046 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40047 __ai __attribute__((target("neon"))) int32x2_t vcvta_s32_f32(float32x2_t __p0) {
  40048   int32x2_t __ret;
  40049   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40050   __ret = (int32x2_t) __builtin_neon_vcvta_s32_v((int8x8_t)__rev0, 2);
  40051   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40052   return __ret;
  40053 }
  40054 #endif
  40055 
  40056 #ifdef __LITTLE_ENDIAN__
        /* vcvtaq_u32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtaq_u32_v with the constant 50 and casts the result to
         * uint32x4_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding to
         * nearest with ties away from zero -- confirm. */
  40057 __ai __attribute__((target("neon"))) uint32x4_t vcvtaq_u32_f32(float32x4_t __p0) {
  40058   uint32x4_t __ret;
  40059   __ret = (uint32x4_t) __builtin_neon_vcvtaq_u32_v((int8x16_t)__p0, 50);
  40060   return __ret;
  40061 }
  40062 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40063 __ai __attribute__((target("neon"))) uint32x4_t vcvtaq_u32_f32(float32x4_t __p0) {
  40064   uint32x4_t __ret;
  40065   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40066   __ret = (uint32x4_t) __builtin_neon_vcvtaq_u32_v((int8x16_t)__rev0, 50);
  40067   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40068   return __ret;
  40069 }
  40070 #endif
  40071 
  40072 #ifdef __LITTLE_ENDIAN__
        /* vcvta_u32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvta_u32_v with the constant 18 and casts the result to
         * uint32x2_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding to
         * nearest with ties away from zero -- confirm. */
  40073 __ai __attribute__((target("neon"))) uint32x2_t vcvta_u32_f32(float32x2_t __p0) {
  40074   uint32x2_t __ret;
  40075   __ret = (uint32x2_t) __builtin_neon_vcvta_u32_v((int8x8_t)__p0, 18);
  40076   return __ret;
  40077 }
  40078 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40079 __ai __attribute__((target("neon"))) uint32x2_t vcvta_u32_f32(float32x2_t __p0) {
  40080   uint32x2_t __ret;
  40081   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40082   __ret = (uint32x2_t) __builtin_neon_vcvta_u32_v((int8x8_t)__rev0, 18);
  40083   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40084   return __ret;
  40085 }
  40086 #endif
  40087 
  40088 #ifdef __LITTLE_ENDIAN__
        /* vcvtmq_s32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtmq_s32_v with the constant 34 and casts the result to
         * int32x4_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding
         * toward minus infinity -- confirm. */
  40089 __ai __attribute__((target("neon"))) int32x4_t vcvtmq_s32_f32(float32x4_t __p0) {
  40090   int32x4_t __ret;
  40091   __ret = (int32x4_t) __builtin_neon_vcvtmq_s32_v((int8x16_t)__p0, 34);
  40092   return __ret;
  40093 }
  40094 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40095 __ai __attribute__((target("neon"))) int32x4_t vcvtmq_s32_f32(float32x4_t __p0) {
  40096   int32x4_t __ret;
  40097   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40098   __ret = (int32x4_t) __builtin_neon_vcvtmq_s32_v((int8x16_t)__rev0, 34);
  40099   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40100   return __ret;
  40101 }
  40102 #endif
  40103 
  40104 #ifdef __LITTLE_ENDIAN__
        /* vcvtm_s32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtm_s32_v with the constant 2 and casts the result to
         * int32x2_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding
         * toward minus infinity -- confirm. */
  40105 __ai __attribute__((target("neon"))) int32x2_t vcvtm_s32_f32(float32x2_t __p0) {
  40106   int32x2_t __ret;
  40107   __ret = (int32x2_t) __builtin_neon_vcvtm_s32_v((int8x8_t)__p0, 2);
  40108   return __ret;
  40109 }
  40110 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40111 __ai __attribute__((target("neon"))) int32x2_t vcvtm_s32_f32(float32x2_t __p0) {
  40112   int32x2_t __ret;
  40113   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40114   __ret = (int32x2_t) __builtin_neon_vcvtm_s32_v((int8x8_t)__rev0, 2);
  40115   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40116   return __ret;
  40117 }
  40118 #endif
  40119 
  40120 #ifdef __LITTLE_ENDIAN__
        /* vcvtmq_u32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtmq_u32_v with the constant 50 and casts the result to
         * uint32x4_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding
         * toward minus infinity -- confirm. */
  40121 __ai __attribute__((target("neon"))) uint32x4_t vcvtmq_u32_f32(float32x4_t __p0) {
  40122   uint32x4_t __ret;
  40123   __ret = (uint32x4_t) __builtin_neon_vcvtmq_u32_v((int8x16_t)__p0, 50);
  40124   return __ret;
  40125 }
  40126 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40127 __ai __attribute__((target("neon"))) uint32x4_t vcvtmq_u32_f32(float32x4_t __p0) {
  40128   uint32x4_t __ret;
  40129   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40130   __ret = (uint32x4_t) __builtin_neon_vcvtmq_u32_v((int8x16_t)__rev0, 50);
  40131   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40132   return __ret;
  40133 }
  40134 #endif
  40135 
  40136 #ifdef __LITTLE_ENDIAN__
        /* vcvtm_u32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtm_u32_v with the constant 18 and casts the result to
         * uint32x2_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding
         * toward minus infinity -- confirm. */
  40137 __ai __attribute__((target("neon"))) uint32x2_t vcvtm_u32_f32(float32x2_t __p0) {
  40138   uint32x2_t __ret;
  40139   __ret = (uint32x2_t) __builtin_neon_vcvtm_u32_v((int8x8_t)__p0, 18);
  40140   return __ret;
  40141 }
  40142 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40143 __ai __attribute__((target("neon"))) uint32x2_t vcvtm_u32_f32(float32x2_t __p0) {
  40144   uint32x2_t __ret;
  40145   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40146   __ret = (uint32x2_t) __builtin_neon_vcvtm_u32_v((int8x8_t)__rev0, 18);
  40147   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40148   return __ret;
  40149 }
  40150 #endif
  40151 
  40152 #ifdef __LITTLE_ENDIAN__
        /* vcvtnq_s32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtnq_s32_v with the constant 34 and casts the result to
         * int32x4_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding to
         * nearest with ties to even -- confirm. */
  40153 __ai __attribute__((target("neon"))) int32x4_t vcvtnq_s32_f32(float32x4_t __p0) {
  40154   int32x4_t __ret;
  40155   __ret = (int32x4_t) __builtin_neon_vcvtnq_s32_v((int8x16_t)__p0, 34);
  40156   return __ret;
  40157 }
  40158 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40159 __ai __attribute__((target("neon"))) int32x4_t vcvtnq_s32_f32(float32x4_t __p0) {
  40160   int32x4_t __ret;
  40161   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40162   __ret = (int32x4_t) __builtin_neon_vcvtnq_s32_v((int8x16_t)__rev0, 34);
  40163   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40164   return __ret;
  40165 }
  40166 #endif
  40167 
  40168 #ifdef __LITTLE_ENDIAN__
        /* vcvtn_s32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtn_s32_v with the constant 2 and casts the result to
         * int32x2_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding to
         * nearest with ties to even -- confirm. */
  40169 __ai __attribute__((target("neon"))) int32x2_t vcvtn_s32_f32(float32x2_t __p0) {
  40170   int32x2_t __ret;
  40171   __ret = (int32x2_t) __builtin_neon_vcvtn_s32_v((int8x8_t)__p0, 2);
  40172   return __ret;
  40173 }
  40174 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40175 __ai __attribute__((target("neon"))) int32x2_t vcvtn_s32_f32(float32x2_t __p0) {
  40176   int32x2_t __ret;
  40177   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40178   __ret = (int32x2_t) __builtin_neon_vcvtn_s32_v((int8x8_t)__rev0, 2);
  40179   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40180   return __ret;
  40181 }
  40182 #endif
  40183 
  40184 #ifdef __LITTLE_ENDIAN__
        /* vcvtnq_u32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtnq_u32_v with the constant 50 and casts the result to
         * uint32x4_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding to
         * nearest with ties to even -- confirm. */
  40185 __ai __attribute__((target("neon"))) uint32x4_t vcvtnq_u32_f32(float32x4_t __p0) {
  40186   uint32x4_t __ret;
  40187   __ret = (uint32x4_t) __builtin_neon_vcvtnq_u32_v((int8x16_t)__p0, 50);
  40188   return __ret;
  40189 }
  40190 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40191 __ai __attribute__((target("neon"))) uint32x4_t vcvtnq_u32_f32(float32x4_t __p0) {
  40192   uint32x4_t __ret;
  40193   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40194   __ret = (uint32x4_t) __builtin_neon_vcvtnq_u32_v((int8x16_t)__rev0, 50);
  40195   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40196   return __ret;
  40197 }
  40198 #endif
  40199 
  40200 #ifdef __LITTLE_ENDIAN__
        /* vcvtn_u32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtn_u32_v with the constant 18 and casts the result to
         * uint32x2_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding to
         * nearest with ties to even -- confirm. */
  40201 __ai __attribute__((target("neon"))) uint32x2_t vcvtn_u32_f32(float32x2_t __p0) {
  40202   uint32x2_t __ret;
  40203   __ret = (uint32x2_t) __builtin_neon_vcvtn_u32_v((int8x8_t)__p0, 18);
  40204   return __ret;
  40205 }
  40206 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40207 __ai __attribute__((target("neon"))) uint32x2_t vcvtn_u32_f32(float32x2_t __p0) {
  40208   uint32x2_t __ret;
  40209   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40210   __ret = (uint32x2_t) __builtin_neon_vcvtn_u32_v((int8x8_t)__rev0, 18);
  40211   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40212   return __ret;
  40213 }
  40214 #endif
  40215 
  40216 #ifdef __LITTLE_ENDIAN__
        /* vcvtpq_s32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtpq_s32_v with the constant 34 and casts the result to
         * int32x4_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding
         * toward plus infinity -- confirm. */
  40217 __ai __attribute__((target("neon"))) int32x4_t vcvtpq_s32_f32(float32x4_t __p0) {
  40218   int32x4_t __ret;
  40219   __ret = (int32x4_t) __builtin_neon_vcvtpq_s32_v((int8x16_t)__p0, 34);
  40220   return __ret;
  40221 }
  40222 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40223 __ai __attribute__((target("neon"))) int32x4_t vcvtpq_s32_f32(float32x4_t __p0) {
  40224   int32x4_t __ret;
  40225   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40226   __ret = (int32x4_t) __builtin_neon_vcvtpq_s32_v((int8x16_t)__rev0, 34);
  40227   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40228   return __ret;
  40229 }
  40230 #endif
  40231 
  40232 #ifdef __LITTLE_ENDIAN__
        /* vcvtp_s32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtp_s32_v with the constant 2 and casts the result to
         * int32x2_t.
         * NOTE(review): ACLE naming suggests float->signed conversion rounding
         * toward plus infinity -- confirm. */
  40233 __ai __attribute__((target("neon"))) int32x2_t vcvtp_s32_f32(float32x2_t __p0) {
  40234   int32x2_t __ret;
  40235   __ret = (int32x2_t) __builtin_neon_vcvtp_s32_v((int8x8_t)__p0, 2);
  40236   return __ret;
  40237 }
  40238 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40239 __ai __attribute__((target("neon"))) int32x2_t vcvtp_s32_f32(float32x2_t __p0) {
  40240   int32x2_t __ret;
  40241   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40242   __ret = (int32x2_t) __builtin_neon_vcvtp_s32_v((int8x8_t)__rev0, 2);
  40243   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40244   return __ret;
  40245 }
  40246 #endif
  40247 
  40248 #ifdef __LITTLE_ENDIAN__
        /* vcvtpq_u32_f32: takes a float32x4_t, casts it to int8x16_t, calls
         * __builtin_neon_vcvtpq_u32_v with the constant 50 and casts the result to
         * uint32x4_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding
         * toward plus infinity -- confirm. */
  40249 __ai __attribute__((target("neon"))) uint32x4_t vcvtpq_u32_f32(float32x4_t __p0) {
  40250   uint32x4_t __ret;
  40251   __ret = (uint32x4_t) __builtin_neon_vcvtpq_u32_v((int8x16_t)__p0, 50);
  40252   return __ret;
  40253 }
  40254 #else
        /* Big-endian build: the operand's 4 lanes are reversed before the builtin
         * call, and the result's 4 lanes are reversed again afterwards. */
  40255 __ai __attribute__((target("neon"))) uint32x4_t vcvtpq_u32_f32(float32x4_t __p0) {
  40256   uint32x4_t __ret;
  40257   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40258   __ret = (uint32x4_t) __builtin_neon_vcvtpq_u32_v((int8x16_t)__rev0, 50);
  40259   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40260   return __ret;
  40261 }
  40262 #endif
  40263 
  40264 #ifdef __LITTLE_ENDIAN__
        /* vcvtp_u32_f32: takes a float32x2_t, casts it to int8x8_t, calls
         * __builtin_neon_vcvtp_u32_v with the constant 18 and casts the result to
         * uint32x2_t.
         * NOTE(review): ACLE naming suggests float->unsigned conversion rounding
         * toward plus infinity -- confirm. */
  40265 __ai __attribute__((target("neon"))) uint32x2_t vcvtp_u32_f32(float32x2_t __p0) {
  40266   uint32x2_t __ret;
  40267   __ret = (uint32x2_t) __builtin_neon_vcvtp_u32_v((int8x8_t)__p0, 18);
  40268   return __ret;
  40269 }
  40270 #else
        /* Big-endian build: the operand's 2 lanes are swapped before the builtin
         * call, and the result's 2 lanes are swapped again afterwards. */
  40271 __ai __attribute__((target("neon"))) uint32x2_t vcvtp_u32_f32(float32x2_t __p0) {
  40272   uint32x2_t __ret;
  40273   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40274   __ret = (uint32x2_t) __builtin_neon_vcvtp_u32_v((int8x8_t)__rev0, 18);
  40275   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40276   return __ret;
  40277 }
  40278 #endif
  40279 
  40280 #ifdef __LITTLE_ENDIAN__
        /* vsha1cq_u32: compiled with target("sha2,neon"). Passes the uint32x4_t __p0,
         * the scalar uint32_t __p1 and the uint32x4_t __p2 directly to
         * __builtin_neon_vsha1cq_u32 (no int8 casts, no type-code argument) and
         * returns the uint32x4_t result.
         * NOTE(review): presumably the SHA1C hash-update step -- confirm against the
         * ACLE crypto intrinsics reference. */
  40281 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1cq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40282   uint32x4_t __ret;
  40283   __ret = (uint32x4_t) __builtin_neon_vsha1cq_u32(__p0, __p1, __p2);
  40284   return __ret;
  40285 }
  40286 #else
        /* Big-endian build: the 4 lanes of the two vector operands (__p0, __p2) are
         * reversed before the call and the result's lanes are reversed afterwards;
         * the scalar __p1 is forwarded untouched. */
  40287 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1cq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40288   uint32x4_t __ret;
  40289   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40290   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40291   __ret = (uint32x4_t) __builtin_neon_vsha1cq_u32(__rev0, __p1, __rev2);
  40292   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40293   return __ret;
  40294 }
  40295 #endif
  40296 
  40297 __ai __attribute__((target("sha2,neon"))) uint32_t vsha1h_u32(uint32_t __p0) {
  40298   uint32_t __ret;
  40299   __ret = (uint32_t) __builtin_neon_vsha1h_u32(__p0);
  40300   return __ret;
  40301 }
  40302 #ifdef __LITTLE_ENDIAN__
  40303 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1mq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40304   uint32x4_t __ret;
  40305   __ret = (uint32x4_t) __builtin_neon_vsha1mq_u32(__p0, __p1, __p2);
  40306   return __ret;
  40307 }
  40308 #else
  40309 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1mq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40310   uint32x4_t __ret;
  40311   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40312   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40313   __ret = (uint32x4_t) __builtin_neon_vsha1mq_u32(__rev0, __p1, __rev2);
  40314   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40315   return __ret;
  40316 }
  40317 #endif
  40318 
  40319 #ifdef __LITTLE_ENDIAN__
  40320 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1pq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40321   uint32x4_t __ret;
  40322   __ret = (uint32x4_t) __builtin_neon_vsha1pq_u32(__p0, __p1, __p2);
  40323   return __ret;
  40324 }
  40325 #else
  40326 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1pq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) {
  40327   uint32x4_t __ret;
  40328   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40329   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40330   __ret = (uint32x4_t) __builtin_neon_vsha1pq_u32(__rev0, __p1, __rev2);
  40331   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40332   return __ret;
  40333 }
  40334 #endif
  40335 
  40336 #ifdef __LITTLE_ENDIAN__
  40337 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su0q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40338   uint32x4_t __ret;
  40339   __ret = (uint32x4_t) __builtin_neon_vsha1su0q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  40340   return __ret;
  40341 }
  40342 #else
  40343 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su0q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40344   uint32x4_t __ret;
  40345   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40346   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40347   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40348   __ret = (uint32x4_t) __builtin_neon_vsha1su0q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  40349   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40350   return __ret;
  40351 }
  40352 #endif
  40353 
  40354 #ifdef __LITTLE_ENDIAN__
  40355 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  40356   uint32x4_t __ret;
  40357   __ret = (uint32x4_t) __builtin_neon_vsha1su1q_u32((int8x16_t)__p0, (int8x16_t)__p1, 50);
  40358   return __ret;
  40359 }
  40360 #else
  40361 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  40362   uint32x4_t __ret;
  40363   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40364   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40365   __ret = (uint32x4_t) __builtin_neon_vsha1su1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  40366   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40367   return __ret;
  40368 }
  40369 #endif
  40370 
  40371 #ifdef __LITTLE_ENDIAN__
  40372 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256hq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40373   uint32x4_t __ret;
  40374   __ret = (uint32x4_t) __builtin_neon_vsha256hq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  40375   return __ret;
  40376 }
  40377 #else
  40378 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256hq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40379   uint32x4_t __ret;
  40380   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40381   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40382   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40383   __ret = (uint32x4_t) __builtin_neon_vsha256hq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  40384   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40385   return __ret;
  40386 }
  40387 #endif
  40388 
  40389 #ifdef __LITTLE_ENDIAN__
  40390 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256h2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40391   uint32x4_t __ret;
  40392   __ret = (uint32x4_t) __builtin_neon_vsha256h2q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  40393   return __ret;
  40394 }
  40395 #else
  40396 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256h2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40397   uint32x4_t __ret;
  40398   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40399   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40400   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40401   __ret = (uint32x4_t) __builtin_neon_vsha256h2q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  40402   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40403   return __ret;
  40404 }
  40405 #endif
  40406 
  40407 #ifdef __LITTLE_ENDIAN__
  40408 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su0q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  40409   uint32x4_t __ret;
  40410   __ret = (uint32x4_t) __builtin_neon_vsha256su0q_u32((int8x16_t)__p0, (int8x16_t)__p1, 50);
  40411   return __ret;
  40412 }
  40413 #else
  40414 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su0q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  40415   uint32x4_t __ret;
  40416   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40417   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40418   __ret = (uint32x4_t) __builtin_neon_vsha256su0q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  40419   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40420   return __ret;
  40421 }
  40422 #endif
  40423 
  40424 #ifdef __LITTLE_ENDIAN__
  40425 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40426   uint32x4_t __ret;
  40427   __ret = (uint32x4_t) __builtin_neon_vsha256su1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  40428   return __ret;
  40429 }
  40430 #else
  40431 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  40432   uint32x4_t __ret;
  40433   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40434   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40435   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  40436   __ret = (uint32x4_t) __builtin_neon_vsha256su1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  40437   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40438   return __ret;
  40439 }
  40440 #endif
  40441 
  40442 #endif
  40443 #if __ARM_ARCH >= 8 && defined(__ARM_FEATURE_DIRECTED_ROUNDING)
  40444 #ifdef __LITTLE_ENDIAN__
  40445 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndq_f16(float16x8_t __p0) {
  40446   float16x8_t __ret;
  40447   __ret = (float16x8_t) __builtin_neon_vrndq_f16((int8x16_t)__p0, 40);
  40448   return __ret;
  40449 }
  40450 #else
  40451 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndq_f16(float16x8_t __p0) {
  40452   float16x8_t __ret;
  40453   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40454   __ret = (float16x8_t) __builtin_neon_vrndq_f16((int8x16_t)__rev0, 40);
  40455   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40456   return __ret;
  40457 }
  40458 #endif
  40459 
  40460 #ifdef __LITTLE_ENDIAN__
  40461 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnd_f16(float16x4_t __p0) {
  40462   float16x4_t __ret;
  40463   __ret = (float16x4_t) __builtin_neon_vrnd_f16((int8x8_t)__p0, 8);
  40464   return __ret;
  40465 }
  40466 #else
  40467 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnd_f16(float16x4_t __p0) {
  40468   float16x4_t __ret;
  40469   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40470   __ret = (float16x4_t) __builtin_neon_vrnd_f16((int8x8_t)__rev0, 8);
  40471   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40472   return __ret;
  40473 }
  40474 #endif
  40475 
  40476 #ifdef __LITTLE_ENDIAN__
  40477 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndaq_f16(float16x8_t __p0) {
  40478   float16x8_t __ret;
  40479   __ret = (float16x8_t) __builtin_neon_vrndaq_f16((int8x16_t)__p0, 40);
  40480   return __ret;
  40481 }
  40482 #else
  40483 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndaq_f16(float16x8_t __p0) {
  40484   float16x8_t __ret;
  40485   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40486   __ret = (float16x8_t) __builtin_neon_vrndaq_f16((int8x16_t)__rev0, 40);
  40487   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40488   return __ret;
  40489 }
  40490 #endif
  40491 
  40492 #ifdef __LITTLE_ENDIAN__
  40493 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnda_f16(float16x4_t __p0) {
  40494   float16x4_t __ret;
  40495   __ret = (float16x4_t) __builtin_neon_vrnda_f16((int8x8_t)__p0, 8);
  40496   return __ret;
  40497 }
  40498 #else
  40499 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnda_f16(float16x4_t __p0) {
  40500   float16x4_t __ret;
  40501   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40502   __ret = (float16x4_t) __builtin_neon_vrnda_f16((int8x8_t)__rev0, 8);
  40503   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40504   return __ret;
  40505 }
  40506 #endif
  40507 
  40508 #ifdef __LITTLE_ENDIAN__
  40509 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndmq_f16(float16x8_t __p0) {
  40510   float16x8_t __ret;
  40511   __ret = (float16x8_t) __builtin_neon_vrndmq_f16((int8x16_t)__p0, 40);
  40512   return __ret;
  40513 }
  40514 #else
  40515 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndmq_f16(float16x8_t __p0) {
  40516   float16x8_t __ret;
  40517   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40518   __ret = (float16x8_t) __builtin_neon_vrndmq_f16((int8x16_t)__rev0, 40);
  40519   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40520   return __ret;
  40521 }
  40522 #endif
  40523 
  40524 #ifdef __LITTLE_ENDIAN__
  40525 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndm_f16(float16x4_t __p0) {
  40526   float16x4_t __ret;
  40527   __ret = (float16x4_t) __builtin_neon_vrndm_f16((int8x8_t)__p0, 8);
  40528   return __ret;
  40529 }
  40530 #else
  40531 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndm_f16(float16x4_t __p0) {
  40532   float16x4_t __ret;
  40533   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40534   __ret = (float16x4_t) __builtin_neon_vrndm_f16((int8x8_t)__rev0, 8);
  40535   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40536   return __ret;
  40537 }
  40538 #endif
  40539 
  40540 #ifdef __LITTLE_ENDIAN__
  40541 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndnq_f16(float16x8_t __p0) {
  40542   float16x8_t __ret;
  40543   __ret = (float16x8_t) __builtin_neon_vrndnq_f16((int8x16_t)__p0, 40);
  40544   return __ret;
  40545 }
  40546 #else
  40547 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndnq_f16(float16x8_t __p0) {
  40548   float16x8_t __ret;
  40549   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40550   __ret = (float16x8_t) __builtin_neon_vrndnq_f16((int8x16_t)__rev0, 40);
  40551   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40552   return __ret;
  40553 }
  40554 #endif
  40555 
  40556 #ifdef __LITTLE_ENDIAN__
  40557 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndn_f16(float16x4_t __p0) {
  40558   float16x4_t __ret;
  40559   __ret = (float16x4_t) __builtin_neon_vrndn_f16((int8x8_t)__p0, 8);
  40560   return __ret;
  40561 }
  40562 #else
  40563 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndn_f16(float16x4_t __p0) {
  40564   float16x4_t __ret;
  40565   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40566   __ret = (float16x4_t) __builtin_neon_vrndn_f16((int8x8_t)__rev0, 8);
  40567   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40568   return __ret;
  40569 }
  40570 #endif
  40571 
  40572 #ifdef __LITTLE_ENDIAN__
  40573 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndpq_f16(float16x8_t __p0) {
  40574   float16x8_t __ret;
  40575   __ret = (float16x8_t) __builtin_neon_vrndpq_f16((int8x16_t)__p0, 40);
  40576   return __ret;
  40577 }
  40578 #else
  40579 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndpq_f16(float16x8_t __p0) {
  40580   float16x8_t __ret;
  40581   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40582   __ret = (float16x8_t) __builtin_neon_vrndpq_f16((int8x16_t)__rev0, 40);
  40583   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40584   return __ret;
  40585 }
  40586 #endif
  40587 
  40588 #ifdef __LITTLE_ENDIAN__
  40589 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndp_f16(float16x4_t __p0) {
  40590   float16x4_t __ret;
  40591   __ret = (float16x4_t) __builtin_neon_vrndp_f16((int8x8_t)__p0, 8);
  40592   return __ret;
  40593 }
  40594 #else
  40595 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndp_f16(float16x4_t __p0) {
  40596   float16x4_t __ret;
  40597   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40598   __ret = (float16x4_t) __builtin_neon_vrndp_f16((int8x8_t)__rev0, 8);
  40599   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40600   return __ret;
  40601 }
  40602 #endif
  40603 
  40604 #ifdef __LITTLE_ENDIAN__
  40605 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndxq_f16(float16x8_t __p0) {
  40606   float16x8_t __ret;
  40607   __ret = (float16x8_t) __builtin_neon_vrndxq_f16((int8x16_t)__p0, 40);
  40608   return __ret;
  40609 }
  40610 #else
  40611 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndxq_f16(float16x8_t __p0) {
  40612   float16x8_t __ret;
  40613   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40614   __ret = (float16x8_t) __builtin_neon_vrndxq_f16((int8x16_t)__rev0, 40);
  40615   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40616   return __ret;
  40617 }
  40618 #endif
  40619 
  40620 #ifdef __LITTLE_ENDIAN__
  40621 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndx_f16(float16x4_t __p0) {
  40622   float16x4_t __ret;
  40623   __ret = (float16x4_t) __builtin_neon_vrndx_f16((int8x8_t)__p0, 8);
  40624   return __ret;
  40625 }
  40626 #else
  40627 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndx_f16(float16x4_t __p0) {
  40628   float16x4_t __ret;
  40629   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40630   __ret = (float16x4_t) __builtin_neon_vrndx_f16((int8x8_t)__rev0, 8);
  40631   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40632   return __ret;
  40633 }
  40634 #endif
  40635 
  40636 #ifdef __LITTLE_ENDIAN__
  40637 __ai __attribute__((target("neon"))) float32x4_t vrndq_f32(float32x4_t __p0) {
  40638   float32x4_t __ret;
  40639   __ret = (float32x4_t) __builtin_neon_vrndq_v((int8x16_t)__p0, 41);
  40640   return __ret;
  40641 }
  40642 #else
  40643 __ai __attribute__((target("neon"))) float32x4_t vrndq_f32(float32x4_t __p0) {
  40644   float32x4_t __ret;
  40645   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40646   __ret = (float32x4_t) __builtin_neon_vrndq_v((int8x16_t)__rev0, 41);
  40647   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40648   return __ret;
  40649 }
  40650 #endif
  40651 
  40652 #ifdef __LITTLE_ENDIAN__
  40653 __ai __attribute__((target("neon"))) float32x2_t vrnd_f32(float32x2_t __p0) {
  40654   float32x2_t __ret;
  40655   __ret = (float32x2_t) __builtin_neon_vrnd_v((int8x8_t)__p0, 9);
  40656   return __ret;
  40657 }
  40658 #else
  40659 __ai __attribute__((target("neon"))) float32x2_t vrnd_f32(float32x2_t __p0) {
  40660   float32x2_t __ret;
  40661   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40662   __ret = (float32x2_t) __builtin_neon_vrnd_v((int8x8_t)__rev0, 9);
  40663   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40664   return __ret;
  40665 }
  40666 #endif
  40667 
  40668 #ifdef __LITTLE_ENDIAN__
  40669 __ai __attribute__((target("neon"))) float32x4_t vrndaq_f32(float32x4_t __p0) {
  40670   float32x4_t __ret;
  40671   __ret = (float32x4_t) __builtin_neon_vrndaq_v((int8x16_t)__p0, 41);
  40672   return __ret;
  40673 }
  40674 #else
  40675 __ai __attribute__((target("neon"))) float32x4_t vrndaq_f32(float32x4_t __p0) {
  40676   float32x4_t __ret;
  40677   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40678   __ret = (float32x4_t) __builtin_neon_vrndaq_v((int8x16_t)__rev0, 41);
  40679   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40680   return __ret;
  40681 }
  40682 #endif
  40683 
  40684 #ifdef __LITTLE_ENDIAN__
  40685 __ai __attribute__((target("neon"))) float32x2_t vrnda_f32(float32x2_t __p0) {
  40686   float32x2_t __ret;
  40687   __ret = (float32x2_t) __builtin_neon_vrnda_v((int8x8_t)__p0, 9);
  40688   return __ret;
  40689 }
  40690 #else
  40691 __ai __attribute__((target("neon"))) float32x2_t vrnda_f32(float32x2_t __p0) {
  40692   float32x2_t __ret;
  40693   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40694   __ret = (float32x2_t) __builtin_neon_vrnda_v((int8x8_t)__rev0, 9);
  40695   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40696   return __ret;
  40697 }
  40698 #endif
  40699 
  40700 #ifdef __LITTLE_ENDIAN__
  40701 __ai __attribute__((target("neon"))) float32x4_t vrndiq_f32(float32x4_t __p0) {
  40702   float32x4_t __ret;
  40703   __ret = (float32x4_t) __builtin_neon_vrndiq_v((int8x16_t)__p0, 41);
  40704   return __ret;
  40705 }
  40706 #else
  40707 __ai __attribute__((target("neon"))) float32x4_t vrndiq_f32(float32x4_t __p0) {
  40708   float32x4_t __ret;
  40709   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40710   __ret = (float32x4_t) __builtin_neon_vrndiq_v((int8x16_t)__rev0, 41);
  40711   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40712   return __ret;
  40713 }
  40714 #endif
  40715 
  40716 #ifdef __LITTLE_ENDIAN__
  40717 __ai __attribute__((target("neon"))) float32x2_t vrndi_f32(float32x2_t __p0) {
  40718   float32x2_t __ret;
  40719   __ret = (float32x2_t) __builtin_neon_vrndi_v((int8x8_t)__p0, 9);
  40720   return __ret;
  40721 }
  40722 #else
  40723 __ai __attribute__((target("neon"))) float32x2_t vrndi_f32(float32x2_t __p0) {
  40724   float32x2_t __ret;
  40725   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40726   __ret = (float32x2_t) __builtin_neon_vrndi_v((int8x8_t)__rev0, 9);
  40727   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40728   return __ret;
  40729 }
  40730 #endif
  40731 
  40732 #ifdef __LITTLE_ENDIAN__
  40733 __ai __attribute__((target("neon"))) float32x4_t vrndmq_f32(float32x4_t __p0) {
  40734   float32x4_t __ret;
  40735   __ret = (float32x4_t) __builtin_neon_vrndmq_v((int8x16_t)__p0, 41);
  40736   return __ret;
  40737 }
  40738 #else
  40739 __ai __attribute__((target("neon"))) float32x4_t vrndmq_f32(float32x4_t __p0) {
  40740   float32x4_t __ret;
  40741   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40742   __ret = (float32x4_t) __builtin_neon_vrndmq_v((int8x16_t)__rev0, 41);
  40743   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40744   return __ret;
  40745 }
  40746 #endif
  40747 
  40748 #ifdef __LITTLE_ENDIAN__
  40749 __ai __attribute__((target("neon"))) float32x2_t vrndm_f32(float32x2_t __p0) {
  40750   float32x2_t __ret;
  40751   __ret = (float32x2_t) __builtin_neon_vrndm_v((int8x8_t)__p0, 9);
  40752   return __ret;
  40753 }
  40754 #else
  40755 __ai __attribute__((target("neon"))) float32x2_t vrndm_f32(float32x2_t __p0) {
  40756   float32x2_t __ret;
  40757   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40758   __ret = (float32x2_t) __builtin_neon_vrndm_v((int8x8_t)__rev0, 9);
  40759   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40760   return __ret;
  40761 }
  40762 #endif
  40763 
  40764 #ifdef __LITTLE_ENDIAN__
  40765 __ai __attribute__((target("neon"))) float32x4_t vrndnq_f32(float32x4_t __p0) {
  40766   float32x4_t __ret;
  40767   __ret = (float32x4_t) __builtin_neon_vrndnq_v((int8x16_t)__p0, 41);
  40768   return __ret;
  40769 }
  40770 #else
  40771 __ai __attribute__((target("neon"))) float32x4_t vrndnq_f32(float32x4_t __p0) {
  40772   float32x4_t __ret;
  40773   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40774   __ret = (float32x4_t) __builtin_neon_vrndnq_v((int8x16_t)__rev0, 41);
  40775   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40776   return __ret;
  40777 }
  40778 #endif
  40779 
  40780 #ifdef __LITTLE_ENDIAN__
  40781 __ai __attribute__((target("neon"))) float32x2_t vrndn_f32(float32x2_t __p0) {
  40782   float32x2_t __ret;
  40783   __ret = (float32x2_t) __builtin_neon_vrndn_v((int8x8_t)__p0, 9);
  40784   return __ret;
  40785 }
  40786 #else
  40787 __ai __attribute__((target("neon"))) float32x2_t vrndn_f32(float32x2_t __p0) {
  40788   float32x2_t __ret;
  40789   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40790   __ret = (float32x2_t) __builtin_neon_vrndn_v((int8x8_t)__rev0, 9);
  40791   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40792   return __ret;
  40793 }
  40794 #endif
  40795 
  40796 __ai __attribute__((target("neon"))) float32_t vrndns_f32(float32_t __p0) {
  40797   float32_t __ret;
  40798   __ret = (float32_t) __builtin_neon_vrndns_f32(__p0);
  40799   return __ret;
  40800 }
  40801 #ifdef __LITTLE_ENDIAN__
  40802 __ai __attribute__((target("neon"))) float32x4_t vrndpq_f32(float32x4_t __p0) {
  40803   float32x4_t __ret;
  40804   __ret = (float32x4_t) __builtin_neon_vrndpq_v((int8x16_t)__p0, 41);
  40805   return __ret;
  40806 }
  40807 #else
  40808 __ai __attribute__((target("neon"))) float32x4_t vrndpq_f32(float32x4_t __p0) {
  40809   float32x4_t __ret;
  40810   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40811   __ret = (float32x4_t) __builtin_neon_vrndpq_v((int8x16_t)__rev0, 41);
  40812   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40813   return __ret;
  40814 }
  40815 #endif
  40816 
  40817 #ifdef __LITTLE_ENDIAN__
  40818 __ai __attribute__((target("neon"))) float32x2_t vrndp_f32(float32x2_t __p0) {
  40819   float32x2_t __ret;
  40820   __ret = (float32x2_t) __builtin_neon_vrndp_v((int8x8_t)__p0, 9);
  40821   return __ret;
  40822 }
  40823 #else
  40824 __ai __attribute__((target("neon"))) float32x2_t vrndp_f32(float32x2_t __p0) {
  40825   float32x2_t __ret;
  40826   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40827   __ret = (float32x2_t) __builtin_neon_vrndp_v((int8x8_t)__rev0, 9);
  40828   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40829   return __ret;
  40830 }
  40831 #endif
  40832 
  40833 #ifdef __LITTLE_ENDIAN__
  40834 __ai __attribute__((target("neon"))) float32x4_t vrndxq_f32(float32x4_t __p0) {
  40835   float32x4_t __ret;
  40836   __ret = (float32x4_t) __builtin_neon_vrndxq_v((int8x16_t)__p0, 41);
  40837   return __ret;
  40838 }
  40839 #else
  40840 __ai __attribute__((target("neon"))) float32x4_t vrndxq_f32(float32x4_t __p0) {
  40841   float32x4_t __ret;
  40842   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40843   __ret = (float32x4_t) __builtin_neon_vrndxq_v((int8x16_t)__rev0, 41);
  40844   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40845   return __ret;
  40846 }
  40847 #endif
  40848 
  40849 #ifdef __LITTLE_ENDIAN__
  40850 __ai __attribute__((target("neon"))) float32x2_t vrndx_f32(float32x2_t __p0) {
  40851   float32x2_t __ret;
  40852   __ret = (float32x2_t) __builtin_neon_vrndx_v((int8x8_t)__p0, 9);
  40853   return __ret;
  40854 }
  40855 #else
  40856 __ai __attribute__((target("neon"))) float32x2_t vrndx_f32(float32x2_t __p0) {
  40857   float32x2_t __ret;
  40858   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40859   __ret = (float32x2_t) __builtin_neon_vrndx_v((int8x8_t)__rev0, 9);
  40860   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40861   return __ret;
  40862 }
  40863 #endif
  40864 
  40865 #endif
  40866 #if __ARM_ARCH >= 8 && defined(__ARM_FEATURE_NUMERIC_MAXMIN)
  40867 #ifdef __LITTLE_ENDIAN__
  40868 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  40869   float16x8_t __ret;
  40870   __ret = (float16x8_t) __builtin_neon_vmaxnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  40871   return __ret;
  40872 }
  40873 #else
  40874 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  40875   float16x8_t __ret;
  40876   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40877   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  40878   __ret = (float16x8_t) __builtin_neon_vmaxnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  40879   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40880   return __ret;
  40881 }
  40882 #endif
  40883 
  40884 #ifdef __LITTLE_ENDIAN__
  40885 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmaxnm_f16(float16x4_t __p0, float16x4_t __p1) {
  40886   float16x4_t __ret;
  40887   __ret = (float16x4_t) __builtin_neon_vmaxnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  40888   return __ret;
  40889 }
  40890 #else
  40891 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmaxnm_f16(float16x4_t __p0, float16x4_t __p1) {
  40892   float16x4_t __ret;
  40893   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40894   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40895   __ret = (float16x4_t) __builtin_neon_vmaxnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  40896   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40897   return __ret;
  40898 }
  40899 #endif
  40900 
  40901 #ifdef __LITTLE_ENDIAN__
  40902 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  40903   float16x8_t __ret;
  40904   __ret = (float16x8_t) __builtin_neon_vminnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  40905   return __ret;
  40906 }
  40907 #else
  40908 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  40909   float16x8_t __ret;
  40910   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  40911   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  40912   __ret = (float16x8_t) __builtin_neon_vminnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  40913   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  40914   return __ret;
  40915 }
  40916 #endif
  40917 
  40918 #ifdef __LITTLE_ENDIAN__
  40919 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vminnm_f16(float16x4_t __p0, float16x4_t __p1) {
  40920   float16x4_t __ret;
  40921   __ret = (float16x4_t) __builtin_neon_vminnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  40922   return __ret;
  40923 }
  40924 #else
  40925 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vminnm_f16(float16x4_t __p0, float16x4_t __p1) {
  40926   float16x4_t __ret;
  40927   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40928   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40929   __ret = (float16x4_t) __builtin_neon_vminnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  40930   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40931   return __ret;
  40932 }
  40933 #endif
  40934 
  40935 #ifdef __LITTLE_ENDIAN__
  40936 __ai __attribute__((target("neon"))) float32x4_t vmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  40937   float32x4_t __ret;
  40938   __ret = (float32x4_t) __builtin_neon_vmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  40939   return __ret;
  40940 }
  40941 #else
  40942 __ai __attribute__((target("neon"))) float32x4_t vmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  40943   float32x4_t __ret;
  40944   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40945   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40946   __ret = (float32x4_t) __builtin_neon_vmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  40947   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40948   return __ret;
  40949 }
  40950 #endif
  40951 
  40952 #ifdef __LITTLE_ENDIAN__
  40953 __ai __attribute__((target("neon"))) float32x2_t vmaxnm_f32(float32x2_t __p0, float32x2_t __p1) {
  40954   float32x2_t __ret;
  40955   __ret = (float32x2_t) __builtin_neon_vmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  40956   return __ret;
  40957 }
  40958 #else
  40959 __ai __attribute__((target("neon"))) float32x2_t vmaxnm_f32(float32x2_t __p0, float32x2_t __p1) {
  40960   float32x2_t __ret;
  40961   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40962   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  40963   __ret = (float32x2_t) __builtin_neon_vmaxnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  40964   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40965   return __ret;
  40966 }
  40967 #endif
  40968 
  40969 #ifdef __LITTLE_ENDIAN__
  40970 __ai __attribute__((target("neon"))) float32x4_t vminnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  40971   float32x4_t __ret;
  40972   __ret = (float32x4_t) __builtin_neon_vminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  40973   return __ret;
  40974 }
  40975 #else
  40976 __ai __attribute__((target("neon"))) float32x4_t vminnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  40977   float32x4_t __ret;
  40978   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  40979   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  40980   __ret = (float32x4_t) __builtin_neon_vminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  40981   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  40982   return __ret;
  40983 }
  40984 #endif
  40985 
  40986 #ifdef __LITTLE_ENDIAN__
  40987 __ai __attribute__((target("neon"))) float32x2_t vminnm_f32(float32x2_t __p0, float32x2_t __p1) {
  40988   float32x2_t __ret;
  40989   __ret = (float32x2_t) __builtin_neon_vminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  40990   return __ret;
  40991 }
  40992 #else
  40993 __ai __attribute__((target("neon"))) float32x2_t vminnm_f32(float32x2_t __p0, float32x2_t __p1) {
  40994   float32x2_t __ret;
  40995   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  40996   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  40997   __ret = (float32x2_t) __builtin_neon_vminnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  40998   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  40999   return __ret;
  41000 }
  41001 #endif
  41002 
  41003 #endif
  41004 #if defined(__ARM_FEATURE_FMA)
  41005 #ifdef __LITTLE_ENDIAN__
  41006 __ai __attribute__((target("neon"))) float32x4_t vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  41007   float32x4_t __ret;
  41008   __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  41009   return __ret;
  41010 }
  41011 #else
  41012 __ai __attribute__((target("neon"))) float32x4_t vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  41013   float32x4_t __ret;
  41014   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41015   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41016   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  41017   __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  41018   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41019   return __ret;
  41020 }
  41021 __ai __attribute__((target("neon"))) float32x4_t __noswap_vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  41022   float32x4_t __ret;
  41023   __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  41024   return __ret;
  41025 }
  41026 #endif
  41027 
  41028 #ifdef __LITTLE_ENDIAN__
  41029 __ai __attribute__((target("neon"))) float32x2_t vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  41030   float32x2_t __ret;
  41031   __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  41032   return __ret;
  41033 }
  41034 #else
  41035 __ai __attribute__((target("neon"))) float32x2_t vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  41036   float32x2_t __ret;
  41037   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41038   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  41039   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  41040   __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  41041   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41042   return __ret;
  41043 }
  41044 __ai __attribute__((target("neon"))) float32x2_t __noswap_vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  41045   float32x2_t __ret;
  41046   __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  41047   return __ret;
  41048 }
  41049 #endif
  41050 
  41051 #ifdef __LITTLE_ENDIAN__
  41052 __ai __attribute__((target("neon"))) float32x4_t vfmaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  41053   float32x4_t __ret;
  41054   __ret = vfmaq_f32(__p0, __p1, (float32x4_t) {__p2, __p2, __p2, __p2});
  41055   return __ret;
  41056 }
  41057 #else
  41058 __ai __attribute__((target("neon"))) float32x4_t vfmaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  41059   float32x4_t __ret;
  41060   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41061   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41062   __ret = __noswap_vfmaq_f32(__rev0, __rev1, (float32x4_t) {__p2, __p2, __p2, __p2});
  41063   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41064   return __ret;
  41065 }
  41066 #endif
  41067 
  41068 #ifdef __LITTLE_ENDIAN__
  41069 __ai __attribute__((target("neon"))) float32x2_t vfma_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  41070   float32x2_t __ret;
  41071   __ret = vfma_f32(__p0, __p1, (float32x2_t) {__p2, __p2});
  41072   return __ret;
  41073 }
  41074 #else
  41075 __ai __attribute__((target("neon"))) float32x2_t vfma_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  41076   float32x2_t __ret;
  41077   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41078   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  41079   __ret = __noswap_vfma_f32(__rev0, __rev1, (float32x2_t) {__p2, __p2});
  41080   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41081   return __ret;
  41082 }
  41083 #endif
  41084 
  41085 #ifdef __LITTLE_ENDIAN__
  41086 __ai __attribute__((target("neon"))) float32x4_t vfmsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  41087   float32x4_t __ret;
  41088   __ret = vfmaq_f32(__p0, -__p1, __p2);
  41089   return __ret;
  41090 }
  41091 #else
  41092 __ai __attribute__((target("neon"))) float32x4_t vfmsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) {
  41093   float32x4_t __ret;
  41094   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41095   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41096   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  41097   __ret = __noswap_vfmaq_f32(__rev0, -__rev1, __rev2);
  41098   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41099   return __ret;
  41100 }
  41101 #endif
  41102 
  41103 #ifdef __LITTLE_ENDIAN__
  41104 __ai __attribute__((target("neon"))) float32x2_t vfms_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  41105   float32x2_t __ret;
  41106   __ret = vfma_f32(__p0, -__p1, __p2);
  41107   return __ret;
  41108 }
  41109 #else
  41110 __ai __attribute__((target("neon"))) float32x2_t vfms_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) {
  41111   float32x2_t __ret;
  41112   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41113   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  41114   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  41115   __ret = __noswap_vfma_f32(__rev0, -__rev1, __rev2);
  41116   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41117   return __ret;
  41118 }
  41119 #endif
  41120 
  41121 #endif
  41122 #if defined(__aarch64__)
  41123 #ifdef __LITTLE_ENDIAN__
  41124 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41125   bfloat16x8_t __ret;
  41126   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_bf16_mf8_fpm(__p0, __p1);
  41127   return __ret;
  41128 }
  41129 #else
  41130 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41131   bfloat16x8_t __ret;
  41132   mfloat8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41133   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_bf16_mf8_fpm(__rev0, __p1);
  41134   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41135   return __ret;
  41136 }
  41137 #endif
  41138 
  41139 #ifdef __LITTLE_ENDIAN__
  41140 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41141   float16x8_t __ret;
  41142   __ret = (float16x8_t) __builtin_neon_vcvt1_f16_mf8_fpm(__p0, __p1);
  41143   return __ret;
  41144 }
  41145 #else
  41146 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41147   float16x8_t __ret;
  41148   mfloat8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41149   __ret = (float16x8_t) __builtin_neon_vcvt1_f16_mf8_fpm(__rev0, __p1);
  41150   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41151   return __ret;
  41152 }
  41153 #endif
  41154 
  41155 #ifdef __LITTLE_ENDIAN__
  41156 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41157   bfloat16x8_t __ret;
  41158   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_high_bf16_mf8_fpm(__p0, __p1);
  41159   return __ret;
  41160 }
  41161 #else
  41162 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41163   bfloat16x8_t __ret;
  41164   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41165   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_high_bf16_mf8_fpm(__rev0, __p1);
  41166   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41167   return __ret;
  41168 }
  41169 #endif
  41170 
  41171 #ifdef __LITTLE_ENDIAN__
  41172 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41173   float16x8_t __ret;
  41174   __ret = (float16x8_t) __builtin_neon_vcvt1_high_f16_mf8_fpm(__p0, __p1);
  41175   return __ret;
  41176 }
  41177 #else
  41178 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41179   float16x8_t __ret;
  41180   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41181   __ret = (float16x8_t) __builtin_neon_vcvt1_high_f16_mf8_fpm(__rev0, __p1);
  41182   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41183   return __ret;
  41184 }
  41185 #endif
  41186 
  41187 #ifdef __LITTLE_ENDIAN__
  41188 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41189   bfloat16x8_t __ret;
  41190   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_low_bf16_mf8_fpm(__p0, __p1);
  41191   return __ret;
  41192 }
  41193 #else
  41194 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41195   bfloat16x8_t __ret;
  41196   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41197   __ret = (bfloat16x8_t) __builtin_neon_vcvt1_low_bf16_mf8_fpm(__rev0, __p1);
  41198   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41199   return __ret;
  41200 }
  41201 #endif
  41202 
  41203 #ifdef __LITTLE_ENDIAN__
  41204 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41205   float16x8_t __ret;
  41206   __ret = (float16x8_t) __builtin_neon_vcvt1_low_f16_mf8_fpm(__p0, __p1);
  41207   return __ret;
  41208 }
  41209 #else
  41210 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41211   float16x8_t __ret;
  41212   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41213   __ret = (float16x8_t) __builtin_neon_vcvt1_low_f16_mf8_fpm(__rev0, __p1);
  41214   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41215   return __ret;
  41216 }
  41217 #endif
  41218 
  41219 #ifdef __LITTLE_ENDIAN__
  41220 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41221   bfloat16x8_t __ret;
  41222   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_bf16_mf8_fpm(__p0, __p1);
  41223   return __ret;
  41224 }
  41225 #else
  41226 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41227   bfloat16x8_t __ret;
  41228   mfloat8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41229   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_bf16_mf8_fpm(__rev0, __p1);
  41230   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41231   return __ret;
  41232 }
  41233 #endif
  41234 
  41235 #ifdef __LITTLE_ENDIAN__
  41236 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41237   float16x8_t __ret;
  41238   __ret = (float16x8_t) __builtin_neon_vcvt2_f16_mf8_fpm(__p0, __p1);
  41239   return __ret;
  41240 }
  41241 #else
  41242 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) {
  41243   float16x8_t __ret;
  41244   mfloat8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41245   __ret = (float16x8_t) __builtin_neon_vcvt2_f16_mf8_fpm(__rev0, __p1);
  41246   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41247   return __ret;
  41248 }
  41249 #endif
  41250 
  41251 #ifdef __LITTLE_ENDIAN__
  41252 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41253   bfloat16x8_t __ret;
  41254   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_high_bf16_mf8_fpm(__p0, __p1);
  41255   return __ret;
  41256 }
  41257 #else
  41258 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41259   bfloat16x8_t __ret;
  41260   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41261   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_high_bf16_mf8_fpm(__rev0, __p1);
  41262   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41263   return __ret;
  41264 }
  41265 #endif
  41266 
  41267 #ifdef __LITTLE_ENDIAN__
  41268 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41269   float16x8_t __ret;
  41270   __ret = (float16x8_t) __builtin_neon_vcvt2_high_f16_mf8_fpm(__p0, __p1);
  41271   return __ret;
  41272 }
  41273 #else
  41274 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41275   float16x8_t __ret;
  41276   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41277   __ret = (float16x8_t) __builtin_neon_vcvt2_high_f16_mf8_fpm(__rev0, __p1);
  41278   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41279   return __ret;
  41280 }
  41281 #endif
  41282 
  41283 #ifdef __LITTLE_ENDIAN__
  41284 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41285   bfloat16x8_t __ret;
  41286   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_low_bf16_mf8_fpm(__p0, __p1);
  41287   return __ret;
  41288 }
  41289 #else
  41290 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41291   bfloat16x8_t __ret;
  41292   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41293   __ret = (bfloat16x8_t) __builtin_neon_vcvt2_low_bf16_mf8_fpm(__rev0, __p1);
  41294   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41295   return __ret;
  41296 }
  41297 #endif
  41298 
  41299 #ifdef __LITTLE_ENDIAN__
  41300 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41301   float16x8_t __ret;
  41302   __ret = (float16x8_t) __builtin_neon_vcvt2_low_f16_mf8_fpm(__p0, __p1);
  41303   return __ret;
  41304 }
  41305 #else
  41306 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) {
  41307   float16x8_t __ret;
  41308   mfloat8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41309   __ret = (float16x8_t) __builtin_neon_vcvt2_low_f16_mf8_fpm(__rev0, __p1);
  41310   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41311   return __ret;
  41312 }
  41313 #endif
  41314 
  41315 #ifdef __LITTLE_ENDIAN__
  41316 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvt_high_mf8_f32_fpm(mfloat8x8_t __p0, float32x4_t __p1, float32x4_t __p2, fpm_t __p3) {
  41317   mfloat8x16_t __ret;
  41318   __ret = (mfloat8x16_t) __builtin_neon_vcvt_high_mf8_f32_fpm(__p0, __p1, __p2, __p3);
  41319   return __ret;
  41320 }
  41321 #else
  41322 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvt_high_mf8_f32_fpm(mfloat8x8_t __p0, float32x4_t __p1, float32x4_t __p2, fpm_t __p3) {
  41323   mfloat8x16_t __ret;
  41324   mfloat8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41325   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41326   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  41327   __ret = (mfloat8x16_t) __builtin_neon_vcvt_high_mf8_f32_fpm(__rev0, __rev1, __rev2, __p3);
  41328   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41329   return __ret;
  41330 }
  41331 #endif
  41332 
  41333 #ifdef __LITTLE_ENDIAN__
  41334 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvtq_mf8_f16_fpm(float16x8_t __p0, float16x8_t __p1, fpm_t __p2) {
  41335   mfloat8x16_t __ret;
  41336   __ret = (mfloat8x16_t) __builtin_neon_vcvtq_mf8_f16_fpm((int8x16_t)__p0, (int8x16_t)__p1, __p2);
  41337   return __ret;
  41338 }
  41339 #else
  41340 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvtq_mf8_f16_fpm(float16x8_t __p0, float16x8_t __p1, fpm_t __p2) {
  41341   mfloat8x16_t __ret;
  41342   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41343   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  41344   __ret = (mfloat8x16_t) __builtin_neon_vcvtq_mf8_f16_fpm((int8x16_t)__rev0, (int8x16_t)__rev1, __p2);
  41345   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41346   return __ret;
  41347 }
  41348 #endif
  41349 
  41350 #ifdef __LITTLE_ENDIAN__
  41351 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f16_fpm(float16x4_t __p0, float16x4_t __p1, fpm_t __p2) {
  41352   mfloat8x8_t __ret;
  41353   __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f16_fpm((int8x8_t)__p0, (int8x8_t)__p1, __p2);
  41354   return __ret;
  41355 }
  41356 #else
  41357 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f16_fpm(float16x4_t __p0, float16x4_t __p1, fpm_t __p2) {
  41358   mfloat8x8_t __ret;
  41359   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41360   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41361   __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f16_fpm((int8x8_t)__rev0, (int8x8_t)__rev1, __p2);
  41362   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41363   return __ret;
  41364 }
  41365 #endif
  41366 
  41367 #ifdef __LITTLE_ENDIAN__
  41368 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f32_fpm(float32x4_t __p0, float32x4_t __p1, fpm_t __p2) {
  41369   mfloat8x8_t __ret;
  41370   __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f32_fpm(__p0, __p1, __p2);
  41371   return __ret;
  41372 }
  41373 #else
  41374 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f32_fpm(float32x4_t __p0, float32x4_t __p1, fpm_t __p2) {
  41375   mfloat8x8_t __ret;
  41376   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41377   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41378   __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f32_fpm(__rev0, __rev1, __p2);
  41379   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41380   return __ret;
  41381 }
  41382 #endif
  41383 
  41384 #ifdef __LITTLE_ENDIAN__
  41385 __ai __attribute__((target("fp8,neon"))) float32x2_t vscale_f32(float32x2_t __p0, int32x2_t __p1) {
  41386   float32x2_t __ret;
  41387   __ret = (float32x2_t) __builtin_neon_vscale_f32((int8x8_t)__p0, (int8x8_t)__p1, 9);
  41388   return __ret;
  41389 }
  41390 #else
  41391 __ai __attribute__((target("fp8,neon"))) float32x2_t vscale_f32(float32x2_t __p0, int32x2_t __p1) {
  41392   float32x2_t __ret;
  41393   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41394   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  41395   __ret = (float32x2_t) __builtin_neon_vscale_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  41396   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41397   return __ret;
  41398 }
  41399 #endif
  41400 
  41401 #ifdef __LITTLE_ENDIAN__
  41402 __ai __attribute__((target("fp8,neon"))) float16x4_t vscale_f16(float16x4_t __p0, int16x4_t __p1) {
  41403   float16x4_t __ret;
  41404   __ret = (float16x4_t) __builtin_neon_vscale_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  41405   return __ret;
  41406 }
  41407 #else
  41408 __ai __attribute__((target("fp8,neon"))) float16x4_t vscale_f16(float16x4_t __p0, int16x4_t __p1) {
  41409   float16x4_t __ret;
  41410   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41411   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41412   __ret = (float16x4_t) __builtin_neon_vscale_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  41413   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41414   return __ret;
  41415 }
  41416 #endif
  41417 
  41418 #ifdef __LITTLE_ENDIAN__
  41419 __ai __attribute__((target("fp8,neon"))) float64x2_t vscaleq_f64(float64x2_t __p0, int64x2_t __p1) {
  41420   float64x2_t __ret;
  41421   __ret = (float64x2_t) __builtin_neon_vscaleq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42);
  41422   return __ret;
  41423 }
  41424 #else
  41425 __ai __attribute__((target("fp8,neon"))) float64x2_t vscaleq_f64(float64x2_t __p0, int64x2_t __p1) {
  41426   float64x2_t __ret;
  41427   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41428   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  41429   __ret = (float64x2_t) __builtin_neon_vscaleq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  41430   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41431   return __ret;
  41432 }
  41433 #endif
  41434 
  41435 #ifdef __LITTLE_ENDIAN__
  41436 __ai __attribute__((target("fp8,neon"))) float32x4_t vscaleq_f32(float32x4_t __p0, int32x4_t __p1) {
  41437   float32x4_t __ret;
  41438   __ret = (float32x4_t) __builtin_neon_vscaleq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41);
  41439   return __ret;
  41440 }
  41441 #else
  41442 __ai __attribute__((target("fp8,neon"))) float32x4_t vscaleq_f32(float32x4_t __p0, int32x4_t __p1) {
  41443   float32x4_t __ret;
  41444   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41445   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  41446   __ret = (float32x4_t) __builtin_neon_vscaleq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  41447   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41448   return __ret;
  41449 }
  41450 #endif
  41451 
  41452 #ifdef __LITTLE_ENDIAN__
  41453 __ai __attribute__((target("fp8,neon"))) float16x8_t vscaleq_f16(float16x8_t __p0, int16x8_t __p1) {
  41454   float16x8_t __ret;
  41455   __ret = (float16x8_t) __builtin_neon_vscaleq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  41456   return __ret;
  41457 }
  41458 #else
  41459 __ai __attribute__((target("fp8,neon"))) float16x8_t vscaleq_f16(float16x8_t __p0, int16x8_t __p1) {
  41460   float16x8_t __ret;
  41461   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41462   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  41463   __ret = (float16x8_t) __builtin_neon_vscaleq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  41464   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41465   return __ret;
  41466 }
  41467 #endif
  41468 
  41469 #ifdef __LITTLE_ENDIAN__
  41470 __ai __attribute__((target("fp8dot2,neon"))) float16x8_t vdotq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41471   float16x8_t __ret;
  41472   __ret = (float16x8_t) __builtin_neon_vdotq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3);
  41473   return __ret;
  41474 }
  41475 #else
  41476 __ai __attribute__((target("fp8dot2,neon"))) float16x8_t vdotq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41477   float16x8_t __ret;
  41478   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41479   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41480   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41481   __ret = (float16x8_t) __builtin_neon_vdotq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3);
  41482   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41483   return __ret;
  41484 }
  41485 #endif
  41486 
  41487 #ifdef __LITTLE_ENDIAN__
  41488 __ai __attribute__((target("fp8dot2,neon"))) float16x4_t vdot_f16_mf8_fpm(float16x4_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) {
  41489   float16x4_t __ret;
  41490   __ret = (float16x4_t) __builtin_neon_vdot_f16_mf8_fpm((int8x8_t)__p0, __p1, __p2, __p3);
  41491   return __ret;
  41492 }
  41493 #else
  41494 __ai __attribute__((target("fp8dot2,neon"))) float16x4_t vdot_f16_mf8_fpm(float16x4_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) {
  41495   float16x4_t __ret;
  41496   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41497   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  41498   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  41499   __ret = (float16x4_t) __builtin_neon_vdot_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3);
  41500   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41501   return __ret;
  41502 }
  41503 #endif
  41504 
  41505 #ifdef __LITTLE_ENDIAN__
  41506 #define vdotq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41507   float16x8_t __ret; \
  41508   float16x8_t __s0 = __p0; \
  41509   mfloat8x16_t __s1 = __p1; \
  41510   mfloat8x8_t __s2 = __p2; \
  41511   fpm_t __s4 = __p4; \
  41512   __ret = (float16x8_t) __builtin_neon_vdotq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  41513   __ret; \
  41514 })
  41515 #else
  41516 #define vdotq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41517   float16x8_t __ret; \
  41518   float16x8_t __s0 = __p0; \
  41519   mfloat8x16_t __s1 = __p1; \
  41520   mfloat8x8_t __s2 = __p2; \
  41521   fpm_t __s4 = __p4; \
  41522   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  41523   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41524   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41525   __ret = (float16x8_t) __builtin_neon_vdotq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41526   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  41527   __ret; \
  41528 })
  41529 #endif
  41530 
  41531 #ifdef __LITTLE_ENDIAN__
  41532 #define vdot_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41533   float16x4_t __ret; \
  41534   float16x4_t __s0 = __p0; \
  41535   mfloat8x8_t __s1 = __p1; \
  41536   mfloat8x8_t __s2 = __p2; \
  41537   fpm_t __s4 = __p4; \
  41538   __ret = (float16x4_t) __builtin_neon_vdot_lane_f16_mf8_fpm((int8x8_t)__s0, __s1, __s2, __p3, __s4); \
  41539   __ret; \
  41540 })
  41541 #else
  41542 #define vdot_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41543   float16x4_t __ret; \
  41544   float16x4_t __s0 = __p0; \
  41545   mfloat8x8_t __s1 = __p1; \
  41546   mfloat8x8_t __s2 = __p2; \
  41547   fpm_t __s4 = __p4; \
  41548   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41549   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  41550   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41551   __ret = (float16x4_t) __builtin_neon_vdot_lane_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41552   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41553   __ret; \
  41554 })
  41555 #endif
  41556 
  41557 #ifdef __LITTLE_ENDIAN__
  41558 #define vdotq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41559   float16x8_t __ret; \
  41560   float16x8_t __s0 = __p0; \
  41561   mfloat8x16_t __s1 = __p1; \
  41562   mfloat8x16_t __s2 = __p2; \
  41563   fpm_t __s4 = __p4; \
  41564   __ret = (float16x8_t) __builtin_neon_vdotq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  41565   __ret; \
  41566 })
  41567 #else
  41568 #define vdotq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41569   float16x8_t __ret; \
  41570   float16x8_t __s0 = __p0; \
  41571   mfloat8x16_t __s1 = __p1; \
  41572   mfloat8x16_t __s2 = __p2; \
  41573   fpm_t __s4 = __p4; \
  41574   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  41575   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41576   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41577   __ret = (float16x8_t) __builtin_neon_vdotq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41578   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  41579   __ret; \
  41580 })
  41581 #endif
  41582 
  41583 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdot_laneq_f16_mf8_fpm: copies __p0
         * (float16x4_t), __p1 (mfloat8x8_t), __p2 (mfloat8x16_t) and __p4 (fpm_t)
         * into typed locals, casts the float16x4_t operand to int8x8_t and calls
         * __builtin_neon_vdot_laneq_f16_mf8_fpm; yields a float16x4_t. __p3 is
         * pasted into the call unchanged (presumably a constant lane index --
         * TODO confirm). */
  41584 #define vdot_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41585   float16x4_t __ret; \
  41586   float16x4_t __s0 = __p0; \
  41587   mfloat8x8_t __s1 = __p1; \
  41588   mfloat8x16_t __s2 = __p2; \
  41589   fpm_t __s4 = __p4; \
  41590   __ret = (float16x4_t) __builtin_neon_vdot_laneq_f16_mf8_fpm((int8x8_t)__s0, __s1, __s2, __p3, __s4); \
  41591   __ret; \
  41592 })
  41593 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41594 #define vdot_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41595   float16x4_t __ret; \
  41596   float16x4_t __s0 = __p0; \
  41597   mfloat8x8_t __s1 = __p1; \
  41598   mfloat8x16_t __s2 = __p2; \
  41599   fpm_t __s4 = __p4; \
  41600   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41601   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  41602   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41603   __ret = (float16x4_t) __builtin_neon_vdot_laneq_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41604   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41605   __ret; \
  41606 })
  41607 #endif
  41608 
  41609 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdotq_f32_mf8_fpm (target "fp8dot4,neon"):
         * passes __p0..__p3 straight to __builtin_neon_vdotq_f32_mf8_fpm and
         * returns the result as a float32x4_t. */
  41610 __ai __attribute__((target("fp8dot4,neon"))) float32x4_t vdotq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41611   float32x4_t __ret;
  41612   __ret = (float32x4_t) __builtin_neon_vdotq_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  41613   return __ret;
  41614 }
  41615 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  41616 __ai __attribute__((target("fp8dot4,neon"))) float32x4_t vdotq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41617   float32x4_t __ret;
  41618   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41619   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41620   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41621   __ret = (float32x4_t) __builtin_neon_vdotq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  41622   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41623   return __ret;
  41624 }
  41625 #endif
  41626 
  41627 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdot_f32_mf8_fpm (target "fp8dot4,neon"):
         * passes __p0..__p3 straight to __builtin_neon_vdot_f32_mf8_fpm and
         * returns the result as a float32x2_t. */
  41628 __ai __attribute__((target("fp8dot4,neon"))) float32x2_t vdot_f32_mf8_fpm(float32x2_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) {
  41629   float32x2_t __ret;
  41630   __ret = (float32x2_t) __builtin_neon_vdot_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  41631   return __ret;
  41632 }
  41633 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: the three vector
         * arguments are element-reversed via __builtin_shufflevector before the
         * call and the two-element result is swapped back before it is returned.
         * __p3 (fpm_t) is passed unchanged. */
  41634 __ai __attribute__((target("fp8dot4,neon"))) float32x2_t vdot_f32_mf8_fpm(float32x2_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) {
  41635   float32x2_t __ret;
  41636   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  41637   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  41638   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  41639   __ret = (float32x2_t) __builtin_neon_vdot_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  41640   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  41641   return __ret;
  41642 }
  41643 #endif
  41644 
  41645 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdotq_lane_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vdotq_lane_f32_mf8_fpm;
         * yields a float32x4_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  41646 #define vdotq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41647   float32x4_t __ret; \
  41648   float32x4_t __s0 = __p0; \
  41649   mfloat8x16_t __s1 = __p1; \
  41650   mfloat8x8_t __s2 = __p2; \
  41651   fpm_t __s4 = __p4; \
  41652   __ret = (float32x4_t) __builtin_neon_vdotq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41653   __ret; \
  41654 })
  41655 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41656 #define vdotq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41657   float32x4_t __ret; \
  41658   float32x4_t __s0 = __p0; \
  41659   mfloat8x16_t __s1 = __p1; \
  41660   mfloat8x8_t __s2 = __p2; \
  41661   fpm_t __s4 = __p4; \
  41662   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41663   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41664   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41665   __ret = (float32x4_t) __builtin_neon_vdotq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41666   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41667   __ret; \
  41668 })
  41669 #endif
  41670 
  41671 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdot_lane_f32_mf8_fpm: copies __p0
         * (float32x2_t), __p1 and __p2 (mfloat8x8_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vdot_lane_f32_mf8_fpm; yields a
         * float32x2_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  41672 #define vdot_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41673   float32x2_t __ret; \
  41674   float32x2_t __s0 = __p0; \
  41675   mfloat8x8_t __s1 = __p1; \
  41676   mfloat8x8_t __s2 = __p2; \
  41677   fpm_t __s4 = __p4; \
  41678   __ret = (float32x2_t) __builtin_neon_vdot_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41679   __ret; \
  41680 })
  41681 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the two-element result is swapped back before being
         * yielded. __p3 and __s4 are passed unchanged. */
  41682 #define vdot_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41683   float32x2_t __ret; \
  41684   float32x2_t __s0 = __p0; \
  41685   mfloat8x8_t __s1 = __p1; \
  41686   mfloat8x8_t __s2 = __p2; \
  41687   fpm_t __s4 = __p4; \
  41688   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  41689   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  41690   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41691   __ret = (float32x2_t) __builtin_neon_vdot_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41692   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  41693   __ret; \
  41694 })
  41695 #endif
  41696 
  41697 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdotq_laneq_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vdotq_laneq_f32_mf8_fpm; yields a
         * float32x4_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  41698 #define vdotq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41699   float32x4_t __ret; \
  41700   float32x4_t __s0 = __p0; \
  41701   mfloat8x16_t __s1 = __p1; \
  41702   mfloat8x16_t __s2 = __p2; \
  41703   fpm_t __s4 = __p4; \
  41704   __ret = (float32x4_t) __builtin_neon_vdotq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41705   __ret; \
  41706 })
  41707 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41708 #define vdotq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41709   float32x4_t __ret; \
  41710   float32x4_t __s0 = __p0; \
  41711   mfloat8x16_t __s1 = __p1; \
  41712   mfloat8x16_t __s2 = __p2; \
  41713   fpm_t __s4 = __p4; \
  41714   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41715   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41716   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41717   __ret = (float32x4_t) __builtin_neon_vdotq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41718   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41719   __ret; \
  41720 })
  41721 #endif
  41722 
  41723 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vdot_laneq_f32_mf8_fpm: copies __p0
         * (float32x2_t), __p1 (mfloat8x8_t), __p2 (mfloat8x16_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vdot_laneq_f32_mf8_fpm;
         * yields a float32x2_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  41724 #define vdot_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41725   float32x2_t __ret; \
  41726   float32x2_t __s0 = __p0; \
  41727   mfloat8x8_t __s1 = __p1; \
  41728   mfloat8x16_t __s2 = __p2; \
  41729   fpm_t __s4 = __p4; \
  41730   __ret = (float32x2_t) __builtin_neon_vdot_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41731   __ret; \
  41732 })
  41733 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the two-element result is swapped back before being
         * yielded. __p3 and __s4 are passed unchanged. */
  41734 #define vdot_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41735   float32x2_t __ret; \
  41736   float32x2_t __s0 = __p0; \
  41737   mfloat8x8_t __s1 = __p1; \
  41738   mfloat8x16_t __s2 = __p2; \
  41739   fpm_t __s4 = __p4; \
  41740   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  41741   mfloat8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  41742   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41743   __ret = (float32x2_t) __builtin_neon_vdot_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41744   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  41745   __ret; \
  41746 })
  41747 #endif
  41748 
  41749 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalbq_f16_mf8_fpm (target "fp8fma,neon"):
         * casts the float16x8_t argument __p0 to int8x16_t, passes it with __p1,
         * __p2 and __p3 to __builtin_neon_vmlalbq_f16_mf8_fpm and returns the
         * result as a float16x8_t. */
  41750 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlalbq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41751   float16x8_t __ret;
  41752   __ret = (float16x8_t) __builtin_neon_vmlalbq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3);
  41753   return __ret;
  41754 }
  41755 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  41756 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlalbq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41757   float16x8_t __ret;
  41758   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  41759   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41760   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41761   __ret = (float16x8_t) __builtin_neon_vmlalbq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3);
  41762   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  41763   return __ret;
  41764 }
  41765 #endif
  41766 
  41767 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalbq_lane_f16_mf8_fpm: copies __p0
         * (float16x8_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals, casts the float16x8_t operand to int8x16_t and calls
         * __builtin_neon_vmlalbq_lane_f16_mf8_fpm; yields a float16x8_t. __p3 is
         * pasted into the call unchanged (presumably a constant lane index --
         * TODO confirm). */
  41768 #define vmlalbq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41769   float16x8_t __ret; \
  41770   float16x8_t __s0 = __p0; \
  41771   mfloat8x16_t __s1 = __p1; \
  41772   mfloat8x8_t __s2 = __p2; \
  41773   fpm_t __s4 = __p4; \
  41774   __ret = (float16x8_t) __builtin_neon_vmlalbq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  41775   __ret; \
  41776 })
  41777 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41778 #define vmlalbq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41779   float16x8_t __ret; \
  41780   float16x8_t __s0 = __p0; \
  41781   mfloat8x16_t __s1 = __p1; \
  41782   mfloat8x8_t __s2 = __p2; \
  41783   fpm_t __s4 = __p4; \
  41784   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  41785   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41786   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41787   __ret = (float16x8_t) __builtin_neon_vmlalbq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41788   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  41789   __ret; \
  41790 })
  41791 #endif
  41792 
  41793 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalbq_laneq_f16_mf8_fpm: copies __p0
         * (float16x8_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals, casts the float16x8_t operand to int8x16_t and calls
         * __builtin_neon_vmlalbq_laneq_f16_mf8_fpm; yields a float16x8_t. __p3 is
         * pasted into the call unchanged (presumably a constant lane index --
         * TODO confirm). */
  41794 #define vmlalbq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41795   float16x8_t __ret; \
  41796   float16x8_t __s0 = __p0; \
  41797   mfloat8x16_t __s1 = __p1; \
  41798   mfloat8x16_t __s2 = __p2; \
  41799   fpm_t __s4 = __p4; \
  41800   __ret = (float16x8_t) __builtin_neon_vmlalbq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  41801   __ret; \
  41802 })
  41803 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41804 #define vmlalbq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41805   float16x8_t __ret; \
  41806   float16x8_t __s0 = __p0; \
  41807   mfloat8x16_t __s1 = __p1; \
  41808   mfloat8x16_t __s2 = __p2; \
  41809   fpm_t __s4 = __p4; \
  41810   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  41811   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41812   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41813   __ret = (float16x8_t) __builtin_neon_vmlalbq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  41814   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  41815   __ret; \
  41816 })
  41817 #endif
  41818 
  41819 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbbq_f32_mf8_fpm (target
         * "fp8fma,neon"): passes __p0..__p3 straight to
         * __builtin_neon_vmlallbbq_f32_mf8_fpm and returns the result as a
         * float32x4_t. */
  41820 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41821   float32x4_t __ret;
  41822   __ret = (float32x4_t) __builtin_neon_vmlallbbq_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  41823   return __ret;
  41824 }
  41825 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  41826 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41827   float32x4_t __ret;
  41828   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41829   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41830   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41831   __ret = (float32x4_t) __builtin_neon_vmlallbbq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  41832   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41833   return __ret;
  41834 }
  41835 #endif
  41836 
  41837 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbbq_lane_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vmlallbbq_lane_f32_mf8_fpm;
         * yields a float32x4_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  41838 #define vmlallbbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41839   float32x4_t __ret; \
  41840   float32x4_t __s0 = __p0; \
  41841   mfloat8x16_t __s1 = __p1; \
  41842   mfloat8x8_t __s2 = __p2; \
  41843   fpm_t __s4 = __p4; \
  41844   __ret = (float32x4_t) __builtin_neon_vmlallbbq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41845   __ret; \
  41846 })
  41847 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41848 #define vmlallbbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41849   float32x4_t __ret; \
  41850   float32x4_t __s0 = __p0; \
  41851   mfloat8x16_t __s1 = __p1; \
  41852   mfloat8x8_t __s2 = __p2; \
  41853   fpm_t __s4 = __p4; \
  41854   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41855   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41856   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41857   __ret = (float32x4_t) __builtin_neon_vmlallbbq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41858   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41859   __ret; \
  41860 })
  41861 #endif
  41862 
  41863 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbbq_laneq_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vmlallbbq_laneq_f32_mf8_fpm; yields a
         * float32x4_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  41864 #define vmlallbbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41865   float32x4_t __ret; \
  41866   float32x4_t __s0 = __p0; \
  41867   mfloat8x16_t __s1 = __p1; \
  41868   mfloat8x16_t __s2 = __p2; \
  41869   fpm_t __s4 = __p4; \
  41870   __ret = (float32x4_t) __builtin_neon_vmlallbbq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41871   __ret; \
  41872 })
  41873 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41874 #define vmlallbbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41875   float32x4_t __ret; \
  41876   float32x4_t __s0 = __p0; \
  41877   mfloat8x16_t __s1 = __p1; \
  41878   mfloat8x16_t __s2 = __p2; \
  41879   fpm_t __s4 = __p4; \
  41880   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41881   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41882   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41883   __ret = (float32x4_t) __builtin_neon_vmlallbbq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41884   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41885   __ret; \
  41886 })
  41887 #endif
  41888 
  41889 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbtq_f32_mf8_fpm (target
         * "fp8fma,neon"): passes __p0..__p3 straight to
         * __builtin_neon_vmlallbtq_f32_mf8_fpm and returns the result as a
         * float32x4_t. */
  41890 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbtq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41891   float32x4_t __ret;
  41892   __ret = (float32x4_t) __builtin_neon_vmlallbtq_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  41893   return __ret;
  41894 }
  41895 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  41896 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbtq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41897   float32x4_t __ret;
  41898   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41899   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41900   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41901   __ret = (float32x4_t) __builtin_neon_vmlallbtq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  41902   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41903   return __ret;
  41904 }
  41905 #endif
  41906 
  41907 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbtq_lane_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vmlallbtq_lane_f32_mf8_fpm;
         * yields a float32x4_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  41908 #define vmlallbtq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41909   float32x4_t __ret; \
  41910   float32x4_t __s0 = __p0; \
  41911   mfloat8x16_t __s1 = __p1; \
  41912   mfloat8x8_t __s2 = __p2; \
  41913   fpm_t __s4 = __p4; \
  41914   __ret = (float32x4_t) __builtin_neon_vmlallbtq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41915   __ret; \
  41916 })
  41917 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41918 #define vmlallbtq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41919   float32x4_t __ret; \
  41920   float32x4_t __s0 = __p0; \
  41921   mfloat8x16_t __s1 = __p1; \
  41922   mfloat8x8_t __s2 = __p2; \
  41923   fpm_t __s4 = __p4; \
  41924   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41925   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41926   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41927   __ret = (float32x4_t) __builtin_neon_vmlallbtq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41928   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41929   __ret; \
  41930 })
  41931 #endif
  41932 
  41933 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallbtq_laneq_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vmlallbtq_laneq_f32_mf8_fpm; yields a
         * float32x4_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  41934 #define vmlallbtq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41935   float32x4_t __ret; \
  41936   float32x4_t __s0 = __p0; \
  41937   mfloat8x16_t __s1 = __p1; \
  41938   mfloat8x16_t __s2 = __p2; \
  41939   fpm_t __s4 = __p4; \
  41940   __ret = (float32x4_t) __builtin_neon_vmlallbtq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41941   __ret; \
  41942 })
  41943 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41944 #define vmlallbtq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41945   float32x4_t __ret; \
  41946   float32x4_t __s0 = __p0; \
  41947   mfloat8x16_t __s1 = __p1; \
  41948   mfloat8x16_t __s2 = __p2; \
  41949   fpm_t __s4 = __p4; \
  41950   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41951   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41952   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41953   __ret = (float32x4_t) __builtin_neon_vmlallbtq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41954   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41955   __ret; \
  41956 })
  41957 #endif
  41958 
  41959 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalltbq_f32_mf8_fpm (target
         * "fp8fma,neon"): passes __p0..__p3 straight to
         * __builtin_neon_vmlalltbq_f32_mf8_fpm and returns the result as a
         * float32x4_t. */
  41960 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlalltbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41961   float32x4_t __ret;
  41962   __ret = (float32x4_t) __builtin_neon_vmlalltbq_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  41963   return __ret;
  41964 }
  41965 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  41966 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlalltbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  41967   float32x4_t __ret;
  41968   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  41969   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41970   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  41971   __ret = (float32x4_t) __builtin_neon_vmlalltbq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  41972   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  41973   return __ret;
  41974 }
  41975 #endif
  41976 
  41977 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalltbq_lane_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vmlalltbq_lane_f32_mf8_fpm;
         * yields a float32x4_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  41978 #define vmlalltbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41979   float32x4_t __ret; \
  41980   float32x4_t __s0 = __p0; \
  41981   mfloat8x16_t __s1 = __p1; \
  41982   mfloat8x8_t __s2 = __p2; \
  41983   fpm_t __s4 = __p4; \
  41984   __ret = (float32x4_t) __builtin_neon_vmlalltbq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  41985   __ret; \
  41986 })
  41987 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  41988 #define vmlalltbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  41989   float32x4_t __ret; \
  41990   float32x4_t __s0 = __p0; \
  41991   mfloat8x16_t __s1 = __p1; \
  41992   mfloat8x8_t __s2 = __p2; \
  41993   fpm_t __s4 = __p4; \
  41994   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  41995   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  41996   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  41997   __ret = (float32x4_t) __builtin_neon_vmlalltbq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  41998   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  41999   __ret; \
  42000 })
  42001 #endif
  42002 
  42003 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlalltbq_laneq_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vmlalltbq_laneq_f32_mf8_fpm; yields a
         * float32x4_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  42004 #define vmlalltbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42005   float32x4_t __ret; \
  42006   float32x4_t __s0 = __p0; \
  42007   mfloat8x16_t __s1 = __p1; \
  42008   mfloat8x16_t __s2 = __p2; \
  42009   fpm_t __s4 = __p4; \
  42010   __ret = (float32x4_t) __builtin_neon_vmlalltbq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  42011   __ret; \
  42012 })
  42013 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  42014 #define vmlalltbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42015   float32x4_t __ret; \
  42016   float32x4_t __s0 = __p0; \
  42017   mfloat8x16_t __s1 = __p1; \
  42018   mfloat8x16_t __s2 = __p2; \
  42019   fpm_t __s4 = __p4; \
  42020   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42021   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42022   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42023   __ret = (float32x4_t) __builtin_neon_vmlalltbq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  42024   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  42025   __ret; \
  42026 })
  42027 #endif
  42028 
  42029 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallttq_f32_mf8_fpm (target
         * "fp8fma,neon"): passes __p0..__p3 straight to
         * __builtin_neon_vmlallttq_f32_mf8_fpm and returns the result as a
         * float32x4_t. */
  42030 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallttq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  42031   float32x4_t __ret;
  42032   __ret = (float32x4_t) __builtin_neon_vmlallttq_f32_mf8_fpm(__p0, __p1, __p2, __p3);
  42033   return __ret;
  42034 }
  42035 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  42036 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallttq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  42037   float32x4_t __ret;
  42038   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  42039   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  42040   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  42041   __ret = (float32x4_t) __builtin_neon_vmlallttq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3);
  42042   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  42043   return __ret;
  42044 }
  42045 #endif
  42046 
  42047 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallttq_lane_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals and calls __builtin_neon_vmlallttq_lane_f32_mf8_fpm;
         * yields a float32x4_t. __p3 is pasted into the call unchanged
         * (presumably a constant lane index -- TODO confirm). */
  42048 #define vmlallttq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42049   float32x4_t __ret; \
  42050   float32x4_t __s0 = __p0; \
  42051   mfloat8x16_t __s1 = __p1; \
  42052   mfloat8x8_t __s2 = __p2; \
  42053   fpm_t __s4 = __p4; \
  42054   __ret = (float32x4_t) __builtin_neon_vmlallttq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  42055   __ret; \
  42056 })
  42057 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  42058 #define vmlallttq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42059   float32x4_t __ret; \
  42060   float32x4_t __s0 = __p0; \
  42061   mfloat8x16_t __s1 = __p1; \
  42062   mfloat8x8_t __s2 = __p2; \
  42063   fpm_t __s4 = __p4; \
  42064   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42065   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42066   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  42067   __ret = (float32x4_t) __builtin_neon_vmlallttq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  42068   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  42069   __ret; \
  42070 })
  42071 #endif
  42072 
  42073 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlallttq_laneq_f32_mf8_fpm: copies __p0
         * (float32x4_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals and calls __builtin_neon_vmlallttq_laneq_f32_mf8_fpm; yields a
         * float32x4_t. __p3 is pasted into the call unchanged (presumably a
         * constant lane index -- TODO confirm). */
  42074 #define vmlallttq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42075   float32x4_t __ret; \
  42076   float32x4_t __s0 = __p0; \
  42077   mfloat8x16_t __s1 = __p1; \
  42078   mfloat8x16_t __s2 = __p2; \
  42079   fpm_t __s4 = __p4; \
  42080   __ret = (float32x4_t) __builtin_neon_vmlallttq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \
  42081   __ret; \
  42082 })
  42083 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  42084 #define vmlallttq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42085   float32x4_t __ret; \
  42086   float32x4_t __s0 = __p0; \
  42087   mfloat8x16_t __s1 = __p1; \
  42088   mfloat8x16_t __s2 = __p2; \
  42089   fpm_t __s4 = __p4; \
  42090   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42091   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42092   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42093   __ret = (float32x4_t) __builtin_neon_vmlallttq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \
  42094   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  42095   __ret; \
  42096 })
  42097 #endif
  42098 
  42099 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlaltq_f16_mf8_fpm (target "fp8fma,neon"):
         * casts the float16x8_t argument __p0 to int8x16_t, passes it with __p1,
         * __p2 and __p3 to __builtin_neon_vmlaltq_f16_mf8_fpm and returns the
         * result as a float16x8_t. */
  42100 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlaltq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  42101   float16x8_t __ret;
  42102   __ret = (float16x8_t) __builtin_neon_vmlaltq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3);
  42103   return __ret;
  42104 }
  42105 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __p0, __p1 and
         * __p2 are element-reversed via __builtin_shufflevector before the call
         * and the result is reversed again before it is returned. __p3 (fpm_t) is
         * passed unchanged. */
  42106 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlaltq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) {
  42107   float16x8_t __ret;
  42108   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  42109   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  42110   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  42111   __ret = (float16x8_t) __builtin_neon_vmlaltq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3);
  42112   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  42113   return __ret;
  42114 }
  42115 #endif
  42116 
  42117 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlaltq_lane_f16_mf8_fpm: copies __p0
         * (float16x8_t), __p1 (mfloat8x16_t), __p2 (mfloat8x8_t) and __p4 (fpm_t)
         * into typed locals, casts the float16x8_t operand to int8x16_t and calls
         * __builtin_neon_vmlaltq_lane_f16_mf8_fpm; yields a float16x8_t. __p3 is
         * pasted into the call unchanged (presumably a constant lane index --
         * TODO confirm). */
  42118 #define vmlaltq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42119   float16x8_t __ret; \
  42120   float16x8_t __s0 = __p0; \
  42121   mfloat8x16_t __s1 = __p1; \
  42122   mfloat8x8_t __s2 = __p2; \
  42123   fpm_t __s4 = __p4; \
  42124   __ret = (float16x8_t) __builtin_neon_vmlaltq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  42125   __ret; \
  42126 })
  42127 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  42128 #define vmlaltq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42129   float16x8_t __ret; \
  42130   float16x8_t __s0 = __p0; \
  42131   mfloat8x16_t __s1 = __p1; \
  42132   mfloat8x8_t __s2 = __p2; \
  42133   fpm_t __s4 = __p4; \
  42134   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42135   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42136   mfloat8x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  42137   __ret = (float16x8_t) __builtin_neon_vmlaltq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  42138   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42139   __ret; \
  42140 })
  42141 #endif
  42142 
  42143 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vmlaltq_laneq_f16_mf8_fpm: copies __p0
         * (float16x8_t), __p1 and __p2 (mfloat8x16_t) and __p4 (fpm_t) into typed
         * locals, casts the float16x8_t operand to int8x16_t and calls
         * __builtin_neon_vmlaltq_laneq_f16_mf8_fpm; yields a float16x8_t. __p3 is
         * pasted into the call unchanged (presumably a constant lane index --
         * TODO confirm). */
  42144 #define vmlaltq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42145   float16x8_t __ret; \
  42146   float16x8_t __s0 = __p0; \
  42147   mfloat8x16_t __s1 = __p1; \
  42148   mfloat8x16_t __s2 = __p2; \
  42149   fpm_t __s4 = __p4; \
  42150   __ret = (float16x8_t) __builtin_neon_vmlaltq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \
  42151   __ret; \
  42152 })
  42153 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0, __s1 and
         * __s2 are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the result is reversed again before being yielded.
         * __p3 and __s4 are passed unchanged. */
  42154 #define vmlaltq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \
  42155   float16x8_t __ret; \
  42156   float16x8_t __s0 = __p0; \
  42157   mfloat8x16_t __s1 = __p1; \
  42158   mfloat8x16_t __s2 = __p2; \
  42159   fpm_t __s4 = __p4; \
  42160   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42161   mfloat8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42162   mfloat8x16_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42163   __ret = (float16x8_t) __builtin_neon_vmlaltq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \
  42164   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42165   __ret; \
  42166 })
  42167 #endif
  42168 
  42169 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vluti2_lane_p8: copies __p0 (poly8x8_t) and
         * __p1 (uint8x8_t) into typed locals, casts both to int8x8_t and passes
         * them with __p2 and the literal 36 to __builtin_neon_vluti2_lane_p8;
         * yields a poly8x16_t. __p2 is pasted into the call unchanged.
         * NOTE(review): the meaning of the trailing 36 is not visible here --
         * presumably a type code consumed by the builtin; confirm. */
  42170 #define vluti2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42171   poly8x16_t __ret; \
  42172   poly8x8_t __s0 = __p0; \
  42173   uint8x8_t __s1 = __p1; \
  42174   __ret = (poly8x16_t) __builtin_neon_vluti2_lane_p8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 36); \
  42175   __ret; \
  42176 })
  42177 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0 and __s1
         * are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the 16-element result is reversed again before being
         * yielded. */
  42178 #define vluti2_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42179   poly8x16_t __ret; \
  42180   poly8x8_t __s0 = __p0; \
  42181   uint8x8_t __s1 = __p1; \
  42182   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42183   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42184   __ret = (poly8x16_t) __builtin_neon_vluti2_lane_p8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 36); \
  42185   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42186   __ret; \
  42187 })
  42188 #endif
  42189 
  42190 #ifdef __LITTLE_ENDIAN__
        /* Little-endian definition of vluti2q_lane_p8: copies __p0 (poly8x16_t)
         * and __p1 (uint8x8_t) into typed locals, casts them to int8x16_t and
         * int8x8_t and passes them with __p2 and the literal 36 to
         * __builtin_neon_vluti2q_lane_p8; yields a poly8x16_t. __p2 is pasted
         * into the call unchanged.
         * NOTE(review): the meaning of the trailing 36 is not visible here --
         * presumably a type code consumed by the builtin; confirm. */
  42191 #define vluti2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42192   poly8x16_t __ret; \
  42193   poly8x16_t __s0 = __p0; \
  42194   uint8x8_t __s1 = __p1; \
  42195   __ret = (poly8x16_t) __builtin_neon_vluti2q_lane_p8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 36); \
  42196   __ret; \
  42197 })
  42198 #else
        /* Definition used when __LITTLE_ENDIAN__ is not defined: __s0 and __s1
         * are element-reversed via __builtin_shufflevector before the same
         * builtin call, and the 16-element result is reversed again before being
         * yielded. */
  42199 #define vluti2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42200   poly8x16_t __ret; \
  42201   poly8x16_t __s0 = __p0; \
  42202   uint8x8_t __s1 = __p1; \
  42203   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42204   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42205   __ret = (poly8x16_t) __builtin_neon_vluti2q_lane_p8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 36); \
  42206   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42207   __ret; \
  42208 })
  42209 #endif
  42210 
  42211 #ifdef __LITTLE_ENDIAN__
  42212 #define vluti2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42213   uint8x16_t __ret; \
  42214   uint8x16_t __s0 = __p0; \
  42215   uint8x8_t __s1 = __p1; \
  42216   __ret = (uint8x16_t) __builtin_neon_vluti2q_lane_u8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 48); \
  42217   __ret; \
  42218 })
  42219 #else
  42220 #define vluti2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42221   uint8x16_t __ret; \
  42222   uint8x16_t __s0 = __p0; \
  42223   uint8x8_t __s1 = __p1; \
  42224   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42225   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42226   __ret = (uint8x16_t) __builtin_neon_vluti2q_lane_u8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 48); \
  42227   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42228   __ret; \
  42229 })
  42230 #endif
  42231 
  42232 #ifdef __LITTLE_ENDIAN__
  42233 #define vluti2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42234   int8x16_t __ret; \
  42235   int8x16_t __s0 = __p0; \
  42236   uint8x8_t __s1 = __p1; \
  42237   __ret = (int8x16_t) __builtin_neon_vluti2q_lane_s8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 32); \
  42238   __ret; \
  42239 })
  42240 #else
  42241 #define vluti2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42242   int8x16_t __ret; \
  42243   int8x16_t __s0 = __p0; \
  42244   uint8x8_t __s1 = __p1; \
  42245   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42246   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42247   __ret = (int8x16_t) __builtin_neon_vluti2q_lane_s8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 32); \
  42248   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42249   __ret; \
  42250 })
  42251 #endif
  42252 
  42253 #ifdef __LITTLE_ENDIAN__
  42254 #define vluti2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42255   uint8x16_t __ret; \
  42256   uint8x8_t __s0 = __p0; \
  42257   uint8x8_t __s1 = __p1; \
  42258   __ret = (uint8x16_t) __builtin_neon_vluti2_lane_u8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 48); \
  42259   __ret; \
  42260 })
  42261 #else
  42262 #define vluti2_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42263   uint8x16_t __ret; \
  42264   uint8x8_t __s0 = __p0; \
  42265   uint8x8_t __s1 = __p1; \
  42266   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42267   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42268   __ret = (uint8x16_t) __builtin_neon_vluti2_lane_u8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 48); \
  42269   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42270   __ret; \
  42271 })
  42272 #endif
  42273 
  42274 #ifdef __LITTLE_ENDIAN__
  42275 #define vluti2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42276   int8x16_t __ret; \
  42277   int8x8_t __s0 = __p0; \
  42278   uint8x8_t __s1 = __p1; \
  42279   __ret = (int8x16_t) __builtin_neon_vluti2_lane_s8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 32); \
  42280   __ret; \
  42281 })
  42282 #else
  42283 #define vluti2_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42284   int8x16_t __ret; \
  42285   int8x8_t __s0 = __p0; \
  42286   uint8x8_t __s1 = __p1; \
  42287   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42288   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42289   __ret = (int8x16_t) __builtin_neon_vluti2_lane_s8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 32); \
  42290   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42291   __ret; \
  42292 })
  42293 #endif
  42294 
  42295 #ifdef __LITTLE_ENDIAN__
  42296 #define vluti2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  42297   poly16x8_t __ret; \
  42298   poly16x4_t __s0 = __p0; \
  42299   uint8x8_t __s1 = __p1; \
  42300   __ret = (poly16x8_t) __builtin_neon_vluti2_lane_p16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 37); \
  42301   __ret; \
  42302 })
  42303 #else
  42304 #define vluti2_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  42305   poly16x8_t __ret; \
  42306   poly16x4_t __s0 = __p0; \
  42307   uint8x8_t __s1 = __p1; \
  42308   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42309   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42310   __ret = (poly16x8_t) __builtin_neon_vluti2_lane_p16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 37); \
  42311   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42312   __ret; \
  42313 })
  42314 #endif
  42315 
  42316 #ifdef __LITTLE_ENDIAN__
  42317 #define vluti2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  42318   poly16x8_t __ret; \
  42319   poly16x8_t __s0 = __p0; \
  42320   uint8x8_t __s1 = __p1; \
  42321   __ret = (poly16x8_t) __builtin_neon_vluti2q_lane_p16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 37); \
  42322   __ret; \
  42323 })
  42324 #else
  42325 #define vluti2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  42326   poly16x8_t __ret; \
  42327   poly16x8_t __s0 = __p0; \
  42328   uint8x8_t __s1 = __p1; \
  42329   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42330   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42331   __ret = (poly16x8_t) __builtin_neon_vluti2q_lane_p16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 37); \
  42332   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42333   __ret; \
  42334 })
  42335 #endif
  42336 
  42337 #ifdef __LITTLE_ENDIAN__
  42338 #define vluti2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  42339   uint16x8_t __ret; \
  42340   uint16x8_t __s0 = __p0; \
  42341   uint8x8_t __s1 = __p1; \
  42342   __ret = (uint16x8_t) __builtin_neon_vluti2q_lane_u16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 49); \
  42343   __ret; \
  42344 })
  42345 #else
  42346 #define vluti2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  42347   uint16x8_t __ret; \
  42348   uint16x8_t __s0 = __p0; \
  42349   uint8x8_t __s1 = __p1; \
  42350   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42351   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42352   __ret = (uint16x8_t) __builtin_neon_vluti2q_lane_u16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 49); \
  42353   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42354   __ret; \
  42355 })
  42356 #endif
  42357 
  42358 #ifdef __LITTLE_ENDIAN__
  42359 #define vluti2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  42360   float16x8_t __ret; \
  42361   float16x8_t __s0 = __p0; \
  42362   uint8x8_t __s1 = __p1; \
  42363   __ret = (float16x8_t) __builtin_neon_vluti2q_lane_f16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 40); \
  42364   __ret; \
  42365 })
  42366 #else
  42367 #define vluti2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  42368   float16x8_t __ret; \
  42369   float16x8_t __s0 = __p0; \
  42370   uint8x8_t __s1 = __p1; \
  42371   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42372   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42373   __ret = (float16x8_t) __builtin_neon_vluti2q_lane_f16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 40); \
  42374   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42375   __ret; \
  42376 })
  42377 #endif
  42378 
  42379 #ifdef __LITTLE_ENDIAN__
  42380 #define vluti2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  42381   int16x8_t __ret; \
  42382   int16x8_t __s0 = __p0; \
  42383   uint8x8_t __s1 = __p1; \
  42384   __ret = (int16x8_t) __builtin_neon_vluti2q_lane_s16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 33); \
  42385   __ret; \
  42386 })
  42387 #else
  42388 #define vluti2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  42389   int16x8_t __ret; \
  42390   int16x8_t __s0 = __p0; \
  42391   uint8x8_t __s1 = __p1; \
  42392   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42393   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42394   __ret = (int16x8_t) __builtin_neon_vluti2q_lane_s16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 33); \
  42395   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42396   __ret; \
  42397 })
  42398 #endif
  42399 
  42400 #ifdef __LITTLE_ENDIAN__
  42401 #define vluti2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  42402   uint16x8_t __ret; \
  42403   uint16x4_t __s0 = __p0; \
  42404   uint8x8_t __s1 = __p1; \
  42405   __ret = (uint16x8_t) __builtin_neon_vluti2_lane_u16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 49); \
  42406   __ret; \
  42407 })
  42408 #else
  42409 #define vluti2_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  42410   uint16x8_t __ret; \
  42411   uint16x4_t __s0 = __p0; \
  42412   uint8x8_t __s1 = __p1; \
  42413   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42414   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42415   __ret = (uint16x8_t) __builtin_neon_vluti2_lane_u16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 49); \
  42416   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42417   __ret; \
  42418 })
  42419 #endif
  42420 
  42421 #ifdef __LITTLE_ENDIAN__
  42422 #define vluti2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  42423   float16x8_t __ret; \
  42424   float16x4_t __s0 = __p0; \
  42425   uint8x8_t __s1 = __p1; \
  42426   __ret = (float16x8_t) __builtin_neon_vluti2_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 40); \
  42427   __ret; \
  42428 })
  42429 #else
  42430 #define vluti2_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  42431   float16x8_t __ret; \
  42432   float16x4_t __s0 = __p0; \
  42433   uint8x8_t __s1 = __p1; \
  42434   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42435   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42436   __ret = (float16x8_t) __builtin_neon_vluti2_lane_f16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 40); \
  42437   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42438   __ret; \
  42439 })
  42440 #endif
  42441 
  42442 #ifdef __LITTLE_ENDIAN__
  42443 #define vluti2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  42444   int16x8_t __ret; \
  42445   int16x4_t __s0 = __p0; \
  42446   uint8x8_t __s1 = __p1; \
  42447   __ret = (int16x8_t) __builtin_neon_vluti2_lane_s16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 33); \
  42448   __ret; \
  42449 })
  42450 #else
  42451 #define vluti2_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  42452   int16x8_t __ret; \
  42453   int16x4_t __s0 = __p0; \
  42454   uint8x8_t __s1 = __p1; \
  42455   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42456   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42457   __ret = (int16x8_t) __builtin_neon_vluti2_lane_s16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 33); \
  42458   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42459   __ret; \
  42460 })
  42461 #endif
  42462 
  42463 #ifdef __LITTLE_ENDIAN__
  42464 #define vluti2_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42465   poly8x16_t __ret; \
  42466   poly8x8_t __s0 = __p0; \
  42467   uint8x16_t __s1 = __p1; \
  42468   __ret = (poly8x16_t) __builtin_neon_vluti2_laneq_p8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 36); \
  42469   __ret; \
  42470 })
  42471 #else
  42472 #define vluti2_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42473   poly8x16_t __ret; \
  42474   poly8x8_t __s0 = __p0; \
  42475   uint8x16_t __s1 = __p1; \
  42476   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42477   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42478   __ret = (poly8x16_t) __builtin_neon_vluti2_laneq_p8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
  42479   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42480   __ret; \
  42481 })
  42482 #endif
  42483 
  42484 #ifdef __LITTLE_ENDIAN__
  42485 #define vluti2q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42486   poly8x16_t __ret; \
  42487   poly8x16_t __s0 = __p0; \
  42488   uint8x16_t __s1 = __p1; \
  42489   __ret = (poly8x16_t) __builtin_neon_vluti2q_laneq_p8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \
  42490   __ret; \
  42491 })
  42492 #else
  42493 #define vluti2q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42494   poly8x16_t __ret; \
  42495   poly8x16_t __s0 = __p0; \
  42496   uint8x16_t __s1 = __p1; \
  42497   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42498   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42499   __ret = (poly8x16_t) __builtin_neon_vluti2q_laneq_p8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
  42500   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42501   __ret; \
  42502 })
  42503 #endif
  42504 
  42505 #ifdef __LITTLE_ENDIAN__
  42506 #define vluti2q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42507   uint8x16_t __ret; \
  42508   uint8x16_t __s0 = __p0; \
  42509   uint8x16_t __s1 = __p1; \
  42510   __ret = (uint8x16_t) __builtin_neon_vluti2q_laneq_u8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  42511   __ret; \
  42512 })
  42513 #else
  42514 #define vluti2q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42515   uint8x16_t __ret; \
  42516   uint8x16_t __s0 = __p0; \
  42517   uint8x16_t __s1 = __p1; \
  42518   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42519   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42520   __ret = (uint8x16_t) __builtin_neon_vluti2q_laneq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  42521   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42522   __ret; \
  42523 })
  42524 #endif
  42525 
  42526 #ifdef __LITTLE_ENDIAN__
  42527 #define vluti2q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42528   int8x16_t __ret; \
  42529   int8x16_t __s0 = __p0; \
  42530   uint8x16_t __s1 = __p1; \
  42531   __ret = (int8x16_t) __builtin_neon_vluti2q_laneq_s8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  42532   __ret; \
  42533 })
  42534 #else
  42535 #define vluti2q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42536   int8x16_t __ret; \
  42537   int8x16_t __s0 = __p0; \
  42538   uint8x16_t __s1 = __p1; \
  42539   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42540   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42541   __ret = (int8x16_t) __builtin_neon_vluti2q_laneq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  42542   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42543   __ret; \
  42544 })
  42545 #endif
  42546 
  42547 #ifdef __LITTLE_ENDIAN__
  42548 #define vluti2_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42549   uint8x16_t __ret; \
  42550   uint8x8_t __s0 = __p0; \
  42551   uint8x16_t __s1 = __p1; \
  42552   __ret = (uint8x16_t) __builtin_neon_vluti2_laneq_u8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 48); \
  42553   __ret; \
  42554 })
  42555 #else
  42556 #define vluti2_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42557   uint8x16_t __ret; \
  42558   uint8x8_t __s0 = __p0; \
  42559   uint8x16_t __s1 = __p1; \
  42560   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42561   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42562   __ret = (uint8x16_t) __builtin_neon_vluti2_laneq_u8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  42563   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42564   __ret; \
  42565 })
  42566 #endif
  42567 
  42568 #ifdef __LITTLE_ENDIAN__
  42569 #define vluti2_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42570   int8x16_t __ret; \
  42571   int8x8_t __s0 = __p0; \
  42572   uint8x16_t __s1 = __p1; \
  42573   __ret = (int8x16_t) __builtin_neon_vluti2_laneq_s8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 32); \
  42574   __ret; \
  42575 })
  42576 #else
  42577 #define vluti2_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42578   int8x16_t __ret; \
  42579   int8x8_t __s0 = __p0; \
  42580   uint8x16_t __s1 = __p1; \
  42581   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42582   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42583   __ret = (int8x16_t) __builtin_neon_vluti2_laneq_s8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  42584   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42585   __ret; \
  42586 })
  42587 #endif
  42588 
  42589 #ifdef __LITTLE_ENDIAN__
  42590 #define vluti2_laneq_p16(__p0, __p1, __p2) __extension__ ({ \
  42591   poly16x8_t __ret; \
  42592   poly16x4_t __s0 = __p0; \
  42593   uint8x16_t __s1 = __p1; \
  42594   __ret = (poly16x8_t) __builtin_neon_vluti2_laneq_p16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 37); \
  42595   __ret; \
  42596 })
  42597 #else
  42598 #define vluti2_laneq_p16(__p0, __p1, __p2) __extension__ ({ \
  42599   poly16x8_t __ret; \
  42600   poly16x4_t __s0 = __p0; \
  42601   uint8x16_t __s1 = __p1; \
  42602   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42603   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42604   __ret = (poly16x8_t) __builtin_neon_vluti2_laneq_p16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 37); \
  42605   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42606   __ret; \
  42607 })
  42608 #endif
  42609 
  42610 #ifdef __LITTLE_ENDIAN__
  42611 #define vluti2q_laneq_p16(__p0, __p1, __p2) __extension__ ({ \
  42612   poly16x8_t __ret; \
  42613   poly16x8_t __s0 = __p0; \
  42614   uint8x16_t __s1 = __p1; \
  42615   __ret = (poly16x8_t) __builtin_neon_vluti2q_laneq_p16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \
  42616   __ret; \
  42617 })
  42618 #else
  42619 #define vluti2q_laneq_p16(__p0, __p1, __p2) __extension__ ({ \
  42620   poly16x8_t __ret; \
  42621   poly16x8_t __s0 = __p0; \
  42622   uint8x16_t __s1 = __p1; \
  42623   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42624   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42625   __ret = (poly16x8_t) __builtin_neon_vluti2q_laneq_p16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \
  42626   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42627   __ret; \
  42628 })
  42629 #endif
  42630 
  42631 #ifdef __LITTLE_ENDIAN__
  42632 #define vluti2q_laneq_u16(__p0, __p1, __p2) __extension__ ({ \
  42633   uint16x8_t __ret; \
  42634   uint16x8_t __s0 = __p0; \
  42635   uint8x16_t __s1 = __p1; \
  42636   __ret = (uint16x8_t) __builtin_neon_vluti2q_laneq_u16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \
  42637   __ret; \
  42638 })
  42639 #else
  42640 #define vluti2q_laneq_u16(__p0, __p1, __p2) __extension__ ({ \
  42641   uint16x8_t __ret; \
  42642   uint16x8_t __s0 = __p0; \
  42643   uint8x16_t __s1 = __p1; \
  42644   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42645   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42646   __ret = (uint16x8_t) __builtin_neon_vluti2q_laneq_u16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
  42647   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42648   __ret; \
  42649 })
  42650 #endif
  42651 
  42652 #ifdef __LITTLE_ENDIAN__
  42653 #define vluti2q_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  42654   float16x8_t __ret; \
  42655   float16x8_t __s0 = __p0; \
  42656   uint8x16_t __s1 = __p1; \
  42657   __ret = (float16x8_t) __builtin_neon_vluti2q_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 40); \
  42658   __ret; \
  42659 })
  42660 #else
  42661 #define vluti2q_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  42662   float16x8_t __ret; \
  42663   float16x8_t __s0 = __p0; \
  42664   uint8x16_t __s1 = __p1; \
  42665   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42666   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42667   __ret = (float16x8_t) __builtin_neon_vluti2q_laneq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 40); \
  42668   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42669   __ret; \
  42670 })
  42671 #endif
  42672 
  42673 #ifdef __LITTLE_ENDIAN__
  42674 #define vluti2q_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  42675   int16x8_t __ret; \
  42676   int16x8_t __s0 = __p0; \
  42677   uint8x16_t __s1 = __p1; \
  42678   __ret = (int16x8_t) __builtin_neon_vluti2q_laneq_s16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  42679   __ret; \
  42680 })
  42681 #else
  42682 #define vluti2q_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  42683   int16x8_t __ret; \
  42684   int16x8_t __s0 = __p0; \
  42685   uint8x16_t __s1 = __p1; \
  42686   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  42687   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42688   __ret = (int16x8_t) __builtin_neon_vluti2q_laneq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  42689   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42690   __ret; \
  42691 })
  42692 #endif
  42693 
  42694 #ifdef __LITTLE_ENDIAN__
  42695 #define vluti2_laneq_u16(__p0, __p1, __p2) __extension__ ({ \
  42696   uint16x8_t __ret; \
  42697   uint16x4_t __s0 = __p0; \
  42698   uint8x16_t __s1 = __p1; \
  42699   __ret = (uint16x8_t) __builtin_neon_vluti2_laneq_u16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 49); \
  42700   __ret; \
  42701 })
  42702 #else
  42703 #define vluti2_laneq_u16(__p0, __p1, __p2) __extension__ ({ \
  42704   uint16x8_t __ret; \
  42705   uint16x4_t __s0 = __p0; \
  42706   uint8x16_t __s1 = __p1; \
  42707   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42708   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42709   __ret = (uint16x8_t) __builtin_neon_vluti2_laneq_u16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 49); \
  42710   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42711   __ret; \
  42712 })
  42713 #endif
  42714 
  42715 #ifdef __LITTLE_ENDIAN__
  42716 #define vluti2_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  42717   float16x8_t __ret; \
  42718   float16x4_t __s0 = __p0; \
  42719   uint8x16_t __s1 = __p1; \
  42720   __ret = (float16x8_t) __builtin_neon_vluti2_laneq_f16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 40); \
  42721   __ret; \
  42722 })
  42723 #else
  42724 #define vluti2_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  42725   float16x8_t __ret; \
  42726   float16x4_t __s0 = __p0; \
  42727   uint8x16_t __s1 = __p1; \
  42728   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42729   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42730   __ret = (float16x8_t) __builtin_neon_vluti2_laneq_f16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 40); \
  42731   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42732   __ret; \
  42733 })
  42734 #endif
  42735 
  42736 #ifdef __LITTLE_ENDIAN__
  42737 #define vluti2_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  42738   int16x8_t __ret; \
  42739   int16x4_t __s0 = __p0; \
  42740   uint8x16_t __s1 = __p1; \
  42741   __ret = (int16x8_t) __builtin_neon_vluti2_laneq_s16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 33); \
  42742   __ret; \
  42743 })
  42744 #else
  42745 #define vluti2_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  42746   int16x8_t __ret; \
  42747   int16x4_t __s0 = __p0; \
  42748   uint8x16_t __s1 = __p1; \
  42749   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  42750   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42751   __ret = (int16x8_t) __builtin_neon_vluti2_laneq_s16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  42752   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42753   __ret; \
  42754 })
  42755 #endif
  42756 
  42757 #ifdef __LITTLE_ENDIAN__
  42758 #define vluti4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42759   poly8x16_t __ret; \
  42760   poly8x16_t __s0 = __p0; \
  42761   uint8x8_t __s1 = __p1; \
  42762   __ret = (poly8x16_t) __builtin_neon_vluti4q_lane_p8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 36); \
  42763   __ret; \
  42764 })
  42765 #else
  42766 #define vluti4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  42767   poly8x16_t __ret; \
  42768   poly8x16_t __s0 = __p0; \
  42769   uint8x8_t __s1 = __p1; \
  42770   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42771   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42772   __ret = (poly8x16_t) __builtin_neon_vluti4q_lane_p8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 36); \
  42773   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42774   __ret; \
  42775 })
  42776 #endif
  42777 
  42778 #ifdef __LITTLE_ENDIAN__
  42779 #define vluti4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42780   uint8x16_t __ret; \
  42781   uint8x16_t __s0 = __p0; \
  42782   uint8x8_t __s1 = __p1; \
  42783   __ret = (uint8x16_t) __builtin_neon_vluti4q_lane_u8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 48); \
  42784   __ret; \
  42785 })
  42786 #else
  42787 #define vluti4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  42788   uint8x16_t __ret; \
  42789   uint8x16_t __s0 = __p0; \
  42790   uint8x8_t __s1 = __p1; \
  42791   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42792   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42793   __ret = (uint8x16_t) __builtin_neon_vluti4q_lane_u8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 48); \
  42794   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42795   __ret; \
  42796 })
  42797 #endif
  42798 
  42799 #ifdef __LITTLE_ENDIAN__
  42800 #define vluti4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42801   int8x16_t __ret; \
  42802   int8x16_t __s0 = __p0; \
  42803   uint8x8_t __s1 = __p1; \
  42804   __ret = (int8x16_t) __builtin_neon_vluti4q_lane_s8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 32); \
  42805   __ret; \
  42806 })
  42807 #else
  42808 #define vluti4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  42809   int8x16_t __ret; \
  42810   int8x16_t __s0 = __p0; \
  42811   uint8x8_t __s1 = __p1; \
  42812   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42813   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42814   __ret = (int8x16_t) __builtin_neon_vluti4q_lane_s8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 32); \
  42815   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42816   __ret; \
  42817 })
  42818 #endif
  42819 
  42820 #ifdef __LITTLE_ENDIAN__
  42821 #define vluti4q_lane_p16_x2(__p0, __p1, __p2) __extension__ ({ \
  42822   poly16x8_t __ret; \
  42823   poly16x8x2_t __s0 = __p0; \
  42824   uint8x8_t __s1 = __p1; \
  42825   __ret = (poly16x8_t) __builtin_neon_vluti4q_lane_p16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 37); \
  42826   __ret; \
  42827 })
  42828 #else
  42829 #define vluti4q_lane_p16_x2(__p0, __p1, __p2) __extension__ ({ \
  42830   poly16x8_t __ret; \
  42831   poly16x8x2_t __s0 = __p0; \
  42832   uint8x8_t __s1 = __p1; \
  42833   poly16x8x2_t __rev0; \
  42834   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  42835   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  42836   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42837   __ret = (poly16x8_t) __builtin_neon_vluti4q_lane_p16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 37); \
  42838   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42839   __ret; \
  42840 })
  42841 #endif
  42842 
  42843 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_lane_u16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a uint16x8_t. __p0 (uint16x8x2_t) and __p1 (uint8x8_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast and
         * passed straight to __builtin_neon_vluti4q_lane_u16_x2.
         * NOTE(review): the trailing 49 is an opaque selector for the builtin,
         * presumably a type code for the uint16x8_t result -- confirm. */
  42844 #define vluti4q_lane_u16_x2(__p0, __p1, __p2) __extension__ ({ \
  42845   uint16x8_t __ret; \
  42846   uint16x8x2_t __s0 = __p0; \
  42847   uint8x8_t __s1 = __p1; \
  42848   __ret = (uint16x8_t) __builtin_neon_vluti4q_lane_u16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 49); \
  42849   __ret; \
  42850 })
  42851 #else
        /* Big-endian build of vluti4q_lane_u16_x2: same builtin call, but each
         * vector input has its lanes reversed with __builtin_shufflevector first
         * and the result lanes are reversed again before being yielded. */
  42852 #define vluti4q_lane_u16_x2(__p0, __p1, __p2) __extension__ ({ \
  42853   uint16x8_t __ret; \
  42854   uint16x8x2_t __s0 = __p0; \
  42855   uint8x8_t __s1 = __p1; \
  42856   uint16x8x2_t __rev0; \
  42857   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  42858   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  42859   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42860   __ret = (uint16x8_t) __builtin_neon_vluti4q_lane_u16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 49); \
  42861   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42862   __ret; \
  42863 })
  42864 #endif
  42865 
  42866 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_lane_f16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a float16x8_t. __p0 (float16x8x2_t) and __p1 (uint8x8_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast and
         * passed straight to __builtin_neon_vluti4q_lane_f16_x2.
         * NOTE(review): the trailing 40 is an opaque selector for the builtin,
         * presumably a type code for the float16x8_t result -- confirm. */
  42867 #define vluti4q_lane_f16_x2(__p0, __p1, __p2) __extension__ ({ \
  42868   float16x8_t __ret; \
  42869   float16x8x2_t __s0 = __p0; \
  42870   uint8x8_t __s1 = __p1; \
  42871   __ret = (float16x8_t) __builtin_neon_vluti4q_lane_f16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 40); \
  42872   __ret; \
  42873 })
  42874 #else
        /* Big-endian build of vluti4q_lane_f16_x2: same builtin call, but each
         * vector input has its lanes reversed with __builtin_shufflevector first
         * and the result lanes are reversed again before being yielded. */
  42875 #define vluti4q_lane_f16_x2(__p0, __p1, __p2) __extension__ ({ \
  42876   float16x8_t __ret; \
  42877   float16x8x2_t __s0 = __p0; \
  42878   uint8x8_t __s1 = __p1; \
  42879   float16x8x2_t __rev0; \
  42880   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  42881   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  42882   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42883   __ret = (float16x8_t) __builtin_neon_vluti4q_lane_f16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 40); \
  42884   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42885   __ret; \
  42886 })
  42887 #endif
  42888 
  42889 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_lane_s16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields an int16x8_t. __p0 (int16x8x2_t) and __p1 (uint8x8_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast and
         * passed straight to __builtin_neon_vluti4q_lane_s16_x2.
         * NOTE(review): the trailing 33 is an opaque selector for the builtin,
         * presumably a type code for the int16x8_t result -- confirm. */
  42890 #define vluti4q_lane_s16_x2(__p0, __p1, __p2) __extension__ ({ \
  42891   int16x8_t __ret; \
  42892   int16x8x2_t __s0 = __p0; \
  42893   uint8x8_t __s1 = __p1; \
  42894   __ret = (int16x8_t) __builtin_neon_vluti4q_lane_s16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 33); \
  42895   __ret; \
  42896 })
  42897 #else
        /* Big-endian build of vluti4q_lane_s16_x2: same builtin call, but each
         * vector input has its lanes reversed with __builtin_shufflevector first
         * and the result lanes are reversed again before being yielded. */
  42898 #define vluti4q_lane_s16_x2(__p0, __p1, __p2) __extension__ ({ \
  42899   int16x8_t __ret; \
  42900   int16x8x2_t __s0 = __p0; \
  42901   uint8x8_t __s1 = __p1; \
  42902   int16x8x2_t __rev0; \
  42903   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  42904   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  42905   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  42906   __ret = (int16x8_t) __builtin_neon_vluti4q_lane_s16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 33); \
  42907   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42908   __ret; \
  42909 })
  42910 #endif
  42911 
  42912 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_p8(__p0, __p1, __p2): statement-expression macro that
         * yields a poly8x16_t. __p0 (poly8x16_t) and __p1 (uint8x16_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: __s0 and __s1 are cast to int8x16_t and passed
         * straight to __builtin_neon_vluti4q_laneq_p8.
         * NOTE(review): the trailing 36 is an opaque selector for the builtin,
         * presumably a type code for the poly8x16_t result -- confirm. */
  42913 #define vluti4q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42914   poly8x16_t __ret; \
  42915   poly8x16_t __s0 = __p0; \
  42916   uint8x16_t __s1 = __p1; \
  42917   __ret = (poly8x16_t) __builtin_neon_vluti4q_laneq_p8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \
  42918   __ret; \
  42919 })
  42920 #else
        /* Big-endian build of vluti4q_laneq_p8: same builtin call, but the 16
         * lanes of each input are reversed with __builtin_shufflevector first and
         * the 16 result lanes are reversed again before being yielded. */
  42921 #define vluti4q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \
  42922   poly8x16_t __ret; \
  42923   poly8x16_t __s0 = __p0; \
  42924   uint8x16_t __s1 = __p1; \
  42925   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42926   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42927   __ret = (poly8x16_t) __builtin_neon_vluti4q_laneq_p8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \
  42928   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42929   __ret; \
  42930 })
  42931 #endif
  42932 
  42933 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_u8(__p0, __p1, __p2): statement-expression macro that
         * yields a uint8x16_t. __p0 and __p1 (both uint8x16_t) are each copied
         * once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: __s0 and __s1 are cast to int8x16_t and passed
         * straight to __builtin_neon_vluti4q_laneq_u8.
         * NOTE(review): the trailing 48 is an opaque selector for the builtin,
         * presumably a type code for the uint8x16_t result -- confirm. */
  42934 #define vluti4q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42935   uint8x16_t __ret; \
  42936   uint8x16_t __s0 = __p0; \
  42937   uint8x16_t __s1 = __p1; \
  42938   __ret = (uint8x16_t) __builtin_neon_vluti4q_laneq_u8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \
  42939   __ret; \
  42940 })
  42941 #else
        /* Big-endian build of vluti4q_laneq_u8: same builtin call, but the 16
         * lanes of each input are reversed with __builtin_shufflevector first and
         * the 16 result lanes are reversed again before being yielded. */
  42942 #define vluti4q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \
  42943   uint8x16_t __ret; \
  42944   uint8x16_t __s0 = __p0; \
  42945   uint8x16_t __s1 = __p1; \
  42946   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42947   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42948   __ret = (uint8x16_t) __builtin_neon_vluti4q_laneq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \
  42949   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42950   __ret; \
  42951 })
  42952 #endif
  42953 
  42954 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_s8(__p0, __p1, __p2): statement-expression macro that
         * yields an int8x16_t. __p0 (int8x16_t) and __p1 (uint8x16_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: __s0 and __s1 are cast to int8x16_t and passed
         * straight to __builtin_neon_vluti4q_laneq_s8.
         * NOTE(review): the trailing 32 is an opaque selector for the builtin,
         * presumably a type code for the int8x16_t result -- confirm. */
  42955 #define vluti4q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42956   int8x16_t __ret; \
  42957   int8x16_t __s0 = __p0; \
  42958   uint8x16_t __s1 = __p1; \
  42959   __ret = (int8x16_t) __builtin_neon_vluti4q_laneq_s8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \
  42960   __ret; \
  42961 })
  42962 #else
        /* Big-endian build of vluti4q_laneq_s8: same builtin call, but the 16
         * lanes of each input are reversed with __builtin_shufflevector first and
         * the 16 result lanes are reversed again before being yielded. */
  42963 #define vluti4q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \
  42964   int8x16_t __ret; \
  42965   int8x16_t __s0 = __p0; \
  42966   uint8x16_t __s1 = __p1; \
  42967   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42968   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42969   __ret = (int8x16_t) __builtin_neon_vluti4q_laneq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \
  42970   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42971   __ret; \
  42972 })
  42973 #endif
  42974 
  42975 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_p16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a poly16x8_t. __p0 (poly16x8x2_t) and __p1 (uint8x16_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast to
         * int8x16_t and passed straight to __builtin_neon_vluti4q_laneq_p16_x2.
         * NOTE(review): the trailing 37 is an opaque selector for the builtin,
         * presumably a type code for the poly16x8_t result -- confirm. */
  42976 #define vluti4q_laneq_p16_x2(__p0, __p1, __p2) __extension__ ({ \
  42977   poly16x8_t __ret; \
  42978   poly16x8x2_t __s0 = __p0; \
  42979   uint8x16_t __s1 = __p1; \
  42980   __ret = (poly16x8_t) __builtin_neon_vluti4q_laneq_p16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 37); \
  42981   __ret; \
  42982 })
  42983 #else
        /* Big-endian build of vluti4q_laneq_p16_x2: same builtin call, but the 8
         * lanes of each half of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  42984 #define vluti4q_laneq_p16_x2(__p0, __p1, __p2) __extension__ ({ \
  42985   poly16x8_t __ret; \
  42986   poly16x8x2_t __s0 = __p0; \
  42987   uint8x16_t __s1 = __p1; \
  42988   poly16x8x2_t __rev0; \
  42989   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  42990   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  42991   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  42992   __ret = (poly16x8_t) __builtin_neon_vluti4q_laneq_p16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 37); \
  42993   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  42994   __ret; \
  42995 })
  42996 #endif
  42997 
  42998 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_u16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a uint16x8_t. __p0 (uint16x8x2_t) and __p1 (uint8x16_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast to
         * int8x16_t and passed straight to __builtin_neon_vluti4q_laneq_u16_x2.
         * NOTE(review): the trailing 49 is an opaque selector for the builtin,
         * presumably a type code for the uint16x8_t result -- confirm. */
  42999 #define vluti4q_laneq_u16_x2(__p0, __p1, __p2) __extension__ ({ \
  43000   uint16x8_t __ret; \
  43001   uint16x8x2_t __s0 = __p0; \
  43002   uint8x16_t __s1 = __p1; \
  43003   __ret = (uint16x8_t) __builtin_neon_vluti4q_laneq_u16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 49); \
  43004   __ret; \
  43005 })
  43006 #else
        /* Big-endian build of vluti4q_laneq_u16_x2: same builtin call, but the 8
         * lanes of each half of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43007 #define vluti4q_laneq_u16_x2(__p0, __p1, __p2) __extension__ ({ \
  43008   uint16x8_t __ret; \
  43009   uint16x8x2_t __s0 = __p0; \
  43010   uint8x16_t __s1 = __p1; \
  43011   uint16x8x2_t __rev0; \
  43012   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  43013   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  43014   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43015   __ret = (uint16x8_t) __builtin_neon_vluti4q_laneq_u16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 49); \
  43016   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43017   __ret; \
  43018 })
  43019 #endif
  43020 
  43021 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_f16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a float16x8_t. __p0 (float16x8x2_t) and __p1 (uint8x16_t) are
         * each copied once into typed locals; __p2 is handed to the builtin as
         * written. Little-endian build: both halves of __s0 and the vector __s1
         * are cast to int8x16_t and passed straight to
         * __builtin_neon_vluti4q_laneq_f16_x2.
         * NOTE(review): the trailing 40 is an opaque selector for the builtin,
         * presumably a type code for the float16x8_t result -- confirm. */
  43022 #define vluti4q_laneq_f16_x2(__p0, __p1, __p2) __extension__ ({ \
  43023   float16x8_t __ret; \
  43024   float16x8x2_t __s0 = __p0; \
  43025   uint8x16_t __s1 = __p1; \
  43026   __ret = (float16x8_t) __builtin_neon_vluti4q_laneq_f16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 40); \
  43027   __ret; \
  43028 })
  43029 #else
        /* Big-endian build of vluti4q_laneq_f16_x2: same builtin call, but the 8
         * lanes of each half of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43030 #define vluti4q_laneq_f16_x2(__p0, __p1, __p2) __extension__ ({ \
  43031   float16x8_t __ret; \
  43032   float16x8x2_t __s0 = __p0; \
  43033   uint8x16_t __s1 = __p1; \
  43034   float16x8x2_t __rev0; \
  43035   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  43036   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  43037   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43038   __ret = (float16x8_t) __builtin_neon_vluti4q_laneq_f16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 40); \
  43039   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43040   __ret; \
  43041 })
  43042 #endif
  43043 
  43044 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_s16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields an int16x8_t. __p0 (int16x8x2_t) and __p1 (uint8x16_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: both halves of __s0 and the vector __s1 are cast to
         * int8x16_t and passed straight to __builtin_neon_vluti4q_laneq_s16_x2.
         * NOTE(review): the trailing 33 is an opaque selector for the builtin,
         * presumably a type code for the int16x8_t result -- confirm. */
  43045 #define vluti4q_laneq_s16_x2(__p0, __p1, __p2) __extension__ ({ \
  43046   int16x8_t __ret; \
  43047   int16x8x2_t __s0 = __p0; \
  43048   uint8x16_t __s1 = __p1; \
  43049   __ret = (int16x8_t) __builtin_neon_vluti4q_laneq_s16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 33); \
  43050   __ret; \
  43051 })
  43052 #else
        /* Big-endian build of vluti4q_laneq_s16_x2: same builtin call, but the 8
         * lanes of each half of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43053 #define vluti4q_laneq_s16_x2(__p0, __p1, __p2) __extension__ ({ \
  43054   int16x8_t __ret; \
  43055   int16x8x2_t __s0 = __p0; \
  43056   uint8x16_t __s1 = __p1; \
  43057   int16x8x2_t __rev0; \
  43058   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  43059   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  43060   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43061   __ret = (int16x8_t) __builtin_neon_vluti4q_laneq_s16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 33); \
  43062   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43063   __ret; \
  43064 })
  43065 #endif
  43066 
  43067 #ifdef __LITTLE_ENDIAN__
        /* vluti2q_lane_bf16(__p0, __p1, __p2): statement-expression macro that
         * yields a bfloat16x8_t. __p0 (bfloat16x8_t) and __p1 (uint8x8_t) are each
         * copied once into typed locals; __p2 is handed to the builtin as written.
         * Little-endian build: __s0 is cast to int8x16_t and __s1 to int8x8_t, then
         * both are passed straight to __builtin_neon_vluti2q_lane_bf16.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43068 #define vluti2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
  43069   bfloat16x8_t __ret; \
  43070   bfloat16x8_t __s0 = __p0; \
  43071   uint8x8_t __s1 = __p1; \
  43072   __ret = (bfloat16x8_t) __builtin_neon_vluti2q_lane_bf16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 43); \
  43073   __ret; \
  43074 })
  43075 #else
        /* Big-endian build of vluti2q_lane_bf16: same builtin call, but the 8
         * lanes of each input are reversed with __builtin_shufflevector first and
         * the 8 result lanes are reversed again before being yielded. */
  43076 #define vluti2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
  43077   bfloat16x8_t __ret; \
  43078   bfloat16x8_t __s0 = __p0; \
  43079   uint8x8_t __s1 = __p1; \
  43080   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  43081   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  43082   __ret = (bfloat16x8_t) __builtin_neon_vluti2q_lane_bf16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 43); \
  43083   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43084   __ret; \
  43085 })
  43086 #endif
  43087 
  43088 #ifdef __LITTLE_ENDIAN__
        /* vluti2_lane_bf16(__p0, __p1, __p2): statement-expression macro that
         * yields a bfloat16x8_t (wider than its bfloat16x4_t input __p0). __p0 and
         * __p1 (uint8x8_t) are each copied once into typed locals; __p2 is handed
         * to the builtin as written. Little-endian build: __s0 and __s1 are cast
         * to int8x8_t and passed straight to __builtin_neon_vluti2_lane_bf16.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43089 #define vluti2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
  43090   bfloat16x8_t __ret; \
  43091   bfloat16x4_t __s0 = __p0; \
  43092   uint8x8_t __s1 = __p1; \
  43093   __ret = (bfloat16x8_t) __builtin_neon_vluti2_lane_bf16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 43); \
  43094   __ret; \
  43095 })
  43096 #else
        /* Big-endian build of vluti2_lane_bf16: same builtin call, but the 4 lanes
         * of __s0 and the 8 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43097 #define vluti2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \
  43098   bfloat16x8_t __ret; \
  43099   bfloat16x4_t __s0 = __p0; \
  43100   uint8x8_t __s1 = __p1; \
  43101   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  43102   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  43103   __ret = (bfloat16x8_t) __builtin_neon_vluti2_lane_bf16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 43); \
  43104   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43105   __ret; \
  43106 })
  43107 #endif
  43108 
  43109 #ifdef __LITTLE_ENDIAN__
        /* vluti2q_laneq_bf16(__p0, __p1, __p2): statement-expression macro that
         * yields a bfloat16x8_t. __p0 (bfloat16x8_t) and __p1 (uint8x16_t) are
         * each copied once into typed locals; __p2 is handed to the builtin as
         * written. Little-endian build: __s0 and __s1 are cast to int8x16_t and
         * passed straight to __builtin_neon_vluti2q_laneq_bf16.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43110 #define vluti2q_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \
  43111   bfloat16x8_t __ret; \
  43112   bfloat16x8_t __s0 = __p0; \
  43113   uint8x16_t __s1 = __p1; \
  43114   __ret = (bfloat16x8_t) __builtin_neon_vluti2q_laneq_bf16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 43); \
  43115   __ret; \
  43116 })
  43117 #else
        /* Big-endian build of vluti2q_laneq_bf16: same builtin call, but the 8
         * lanes of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43118 #define vluti2q_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \
  43119   bfloat16x8_t __ret; \
  43120   bfloat16x8_t __s0 = __p0; \
  43121   uint8x16_t __s1 = __p1; \
  43122   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  43123   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43124   __ret = (bfloat16x8_t) __builtin_neon_vluti2q_laneq_bf16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 43); \
  43125   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43126   __ret; \
  43127 })
  43128 #endif
  43129 
  43130 #ifdef __LITTLE_ENDIAN__
        /* vluti2_laneq_bf16(__p0, __p1, __p2): statement-expression macro that
         * yields a bfloat16x8_t (wider than its bfloat16x4_t input __p0). __p0 and
         * __p1 (uint8x16_t) are each copied once into typed locals; __p2 is handed
         * to the builtin as written. Little-endian build: __s0 is cast to int8x8_t
         * and __s1 to int8x16_t, then both are passed straight to
         * __builtin_neon_vluti2_laneq_bf16.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43131 #define vluti2_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \
  43132   bfloat16x8_t __ret; \
  43133   bfloat16x4_t __s0 = __p0; \
  43134   uint8x16_t __s1 = __p1; \
  43135   __ret = (bfloat16x8_t) __builtin_neon_vluti2_laneq_bf16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 43); \
  43136   __ret; \
  43137 })
  43138 #else
        /* Big-endian build of vluti2_laneq_bf16: same builtin call, but the 4
         * lanes of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43139 #define vluti2_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \
  43140   bfloat16x8_t __ret; \
  43141   bfloat16x4_t __s0 = __p0; \
  43142   uint8x16_t __s1 = __p1; \
  43143   bfloat16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  43144   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43145   __ret = (bfloat16x8_t) __builtin_neon_vluti2_laneq_bf16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 43); \
  43146   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43147   __ret; \
  43148 })
  43149 #endif
  43150 
  43151 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_lane_bf16_x2(__p0, __p1, __p2): statement-expression macro that
         * yields a bfloat16x8_t. __p0 (bfloat16x8x2_t) and __p1 (uint8x8_t) are
         * each copied once into typed locals; __p2 is handed to the builtin as
         * written. Little-endian build: both halves of __s0 and the vector __s1
         * are cast and passed straight to __builtin_neon_vluti4q_lane_bf16_x2.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43152 #define vluti4q_lane_bf16_x2(__p0, __p1, __p2) __extension__ ({ \
  43153   bfloat16x8_t __ret; \
  43154   bfloat16x8x2_t __s0 = __p0; \
  43155   uint8x8_t __s1 = __p1; \
  43156   __ret = (bfloat16x8_t) __builtin_neon_vluti4q_lane_bf16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 43); \
  43157   __ret; \
  43158 })
  43159 #else
        /* Big-endian build of vluti4q_lane_bf16_x2: same builtin call, but each
         * vector input has its 8 lanes reversed with __builtin_shufflevector first
         * and the 8 result lanes are reversed again before being yielded. */
  43160 #define vluti4q_lane_bf16_x2(__p0, __p1, __p2) __extension__ ({ \
  43161   bfloat16x8_t __ret; \
  43162   bfloat16x8x2_t __s0 = __p0; \
  43163   uint8x8_t __s1 = __p1; \
  43164   bfloat16x8x2_t __rev0; \
  43165   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  43166   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  43167   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  43168   __ret = (bfloat16x8_t) __builtin_neon_vluti4q_lane_bf16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 43); \
  43169   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43170   __ret; \
  43171 })
  43172 #endif
  43173 
  43174 #ifdef __LITTLE_ENDIAN__
        /* vluti4q_laneq_bf16_x2(__p0, __p1, __p2): statement-expression macro
         * that yields a bfloat16x8_t. __p0 (bfloat16x8x2_t) and __p1 (uint8x16_t)
         * are each copied once into typed locals; __p2 is handed to the builtin
         * as written. Little-endian build: both halves of __s0 and the vector
         * __s1 are cast to int8x16_t and passed straight to
         * __builtin_neon_vluti4q_laneq_bf16_x2.
         * NOTE(review): the trailing 43 is an opaque selector for the builtin,
         * presumably a type code for the bfloat16x8_t result -- confirm. */
  43175 #define vluti4q_laneq_bf16_x2(__p0, __p1, __p2) __extension__ ({ \
  43176   bfloat16x8_t __ret; \
  43177   bfloat16x8x2_t __s0 = __p0; \
  43178   uint8x16_t __s1 = __p1; \
  43179   __ret = (bfloat16x8_t) __builtin_neon_vluti4q_laneq_bf16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 43); \
  43180   __ret; \
  43181 })
  43182 #else
        /* Big-endian build of vluti4q_laneq_bf16_x2: same builtin call, but the 8
         * lanes of each half of __s0 and the 16 lanes of __s1 are reversed with
         * __builtin_shufflevector first, and the 8 result lanes are reversed
         * again before being yielded. */
  43183 #define vluti4q_laneq_bf16_x2(__p0, __p1, __p2) __extension__ ({ \
  43184   bfloat16x8_t __ret; \
  43185   bfloat16x8x2_t __s0 = __p0; \
  43186   uint8x16_t __s1 = __p1; \
  43187   bfloat16x8x2_t __rev0; \
  43188   __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  43189   __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  43190   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43191   __ret = (bfloat16x8_t) __builtin_neon_vluti4q_laneq_bf16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 43); \
  43192   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  43193   __ret; \
  43194 })
  43195 #endif
  43196 
  43197 #ifdef __LITTLE_ENDIAN__
        /* vamaxq_f64: wrapper around __builtin_neon_vamaxq_f64, compiled with the
         * target features "neon,faminmax". Takes two float64x2_t operands and
         * returns a float64x2_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 42 is an opaque selector for the builtin,
         * presumably a type code for float64x2_t -- confirm. */
  43198 __ai __attribute__((target("neon,faminmax"))) float64x2_t vamaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  43199   float64x2_t __ret;
  43200   __ret = (float64x2_t) __builtin_neon_vamaxq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42);
  43201   return __ret;
  43202 }
  43203 #else
        /* Big-endian build of vamaxq_f64: reverses the 2 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43204 __ai __attribute__((target("neon,faminmax"))) float64x2_t vamaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  43205   float64x2_t __ret;
  43206   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43207   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  43208   __ret = (float64x2_t) __builtin_neon_vamaxq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  43209   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43210   return __ret;
  43211 }
  43212 #endif
  43213 
  43214 #ifdef __LITTLE_ENDIAN__
        /* vamaxq_f32: wrapper around __builtin_neon_vamaxq_f32, compiled with the
         * target features "neon,faminmax". Takes two float32x4_t operands and
         * returns a float32x4_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 41 is an opaque selector for the builtin,
         * presumably a type code for float32x4_t -- confirm. */
  43215 __ai __attribute__((target("neon,faminmax"))) float32x4_t vamaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  43216   float32x4_t __ret;
  43217   __ret = (float32x4_t) __builtin_neon_vamaxq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41);
  43218   return __ret;
  43219 }
  43220 #else
        /* Big-endian build of vamaxq_f32: reverses the 4 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43221 __ai __attribute__((target("neon,faminmax"))) float32x4_t vamaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  43222   float32x4_t __ret;
  43223   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43224   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43225   __ret = (float32x4_t) __builtin_neon_vamaxq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  43226   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43227   return __ret;
  43228 }
  43229 #endif
  43230 
  43231 #ifdef __LITTLE_ENDIAN__
        /* vamaxq_f16: wrapper around __builtin_neon_vamaxq_f16, compiled with the
         * target features "neon,faminmax". Takes two float16x8_t operands and
         * returns a float16x8_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 40 is an opaque selector for the builtin,
         * presumably a type code for float16x8_t -- confirm. */
  43232 __ai __attribute__((target("neon,faminmax"))) float16x8_t vamaxq_f16(float16x8_t __p0, float16x8_t __p1) {
  43233   float16x8_t __ret;
  43234   __ret = (float16x8_t) __builtin_neon_vamaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  43235   return __ret;
  43236 }
  43237 #else
        /* Big-endian build of vamaxq_f16: reverses the 8 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43238 __ai __attribute__((target("neon,faminmax"))) float16x8_t vamaxq_f16(float16x8_t __p0, float16x8_t __p1) {
  43239   float16x8_t __ret;
  43240   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  43241   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  43242   __ret = (float16x8_t) __builtin_neon_vamaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  43243   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  43244   return __ret;
  43245 }
  43246 #endif
  43247 
  43248 #ifdef __LITTLE_ENDIAN__
        /* vamax_f32: wrapper around __builtin_neon_vamax_f32, compiled with the
         * target features "neon,faminmax". Takes two float32x2_t operands and
         * returns a float32x2_t. Little-endian build: both operands are cast to
         * int8x8_t and forwarded unchanged.
         * NOTE(review): the literal 9 is an opaque selector for the builtin,
         * presumably a type code for float32x2_t -- confirm. */
  43249 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamax_f32(float32x2_t __p0, float32x2_t __p1) {
  43250   float32x2_t __ret;
  43251   __ret = (float32x2_t) __builtin_neon_vamax_f32((int8x8_t)__p0, (int8x8_t)__p1, 9);
  43252   return __ret;
  43253 }
  43254 #else
        /* Big-endian build of vamax_f32: reverses the 2 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43255 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamax_f32(float32x2_t __p0, float32x2_t __p1) {
  43256   float32x2_t __ret;
  43257   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43258   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  43259   __ret = (float32x2_t) __builtin_neon_vamax_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  43260   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43261   return __ret;
  43262 }
  43263 #endif
  43264 
  43265 #ifdef __LITTLE_ENDIAN__
        /* vamax_f16: wrapper around __builtin_neon_vamax_f16, compiled with the
         * target features "neon,faminmax". Takes two float16x4_t operands and
         * returns a float16x4_t. Little-endian build: both operands are cast to
         * int8x8_t and forwarded unchanged.
         * NOTE(review): the literal 8 is an opaque selector for the builtin,
         * presumably a type code for float16x4_t -- confirm. */
  43266 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamax_f16(float16x4_t __p0, float16x4_t __p1) {
  43267   float16x4_t __ret;
  43268   __ret = (float16x4_t) __builtin_neon_vamax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  43269   return __ret;
  43270 }
  43271 #else
        /* Big-endian build of vamax_f16: reverses the 4 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43272 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamax_f16(float16x4_t __p0, float16x4_t __p1) {
  43273   float16x4_t __ret;
  43274   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43275   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43276   __ret = (float16x4_t) __builtin_neon_vamax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  43277   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43278   return __ret;
  43279 }
  43280 #endif
  43281 
  43282 #ifdef __LITTLE_ENDIAN__
        /* vaminq_f64: wrapper around __builtin_neon_vaminq_f64, compiled with the
         * target features "neon,faminmax". Takes two float64x2_t operands and
         * returns a float64x2_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 42 is an opaque selector for the builtin,
         * presumably a type code for float64x2_t -- confirm. */
  43283 __ai __attribute__((target("neon,faminmax"))) float64x2_t vaminq_f64(float64x2_t __p0, float64x2_t __p1) {
  43284   float64x2_t __ret;
  43285   __ret = (float64x2_t) __builtin_neon_vaminq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42);
  43286   return __ret;
  43287 }
  43288 #else
        /* Big-endian build of vaminq_f64: reverses the 2 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43289 __ai __attribute__((target("neon,faminmax"))) float64x2_t vaminq_f64(float64x2_t __p0, float64x2_t __p1) {
  43290   float64x2_t __ret;
  43291   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43292   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  43293   __ret = (float64x2_t) __builtin_neon_vaminq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  43294   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43295   return __ret;
  43296 }
  43297 #endif
  43298 
  43299 #ifdef __LITTLE_ENDIAN__
        /* vaminq_f32: wrapper around __builtin_neon_vaminq_f32, compiled with the
         * target features "neon,faminmax". Takes two float32x4_t operands and
         * returns a float32x4_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 41 is an opaque selector for the builtin,
         * presumably a type code for float32x4_t -- confirm. */
  43300 __ai __attribute__((target("neon,faminmax"))) float32x4_t vaminq_f32(float32x4_t __p0, float32x4_t __p1) {
  43301   float32x4_t __ret;
  43302   __ret = (float32x4_t) __builtin_neon_vaminq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41);
  43303   return __ret;
  43304 }
  43305 #else
        /* Big-endian build of vaminq_f32: reverses the 4 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43306 __ai __attribute__((target("neon,faminmax"))) float32x4_t vaminq_f32(float32x4_t __p0, float32x4_t __p1) {
  43307   float32x4_t __ret;
  43308   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43309   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43310   __ret = (float32x4_t) __builtin_neon_vaminq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  43311   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43312   return __ret;
  43313 }
  43314 #endif
  43315 
  43316 #ifdef __LITTLE_ENDIAN__
        /* vaminq_f16: wrapper around __builtin_neon_vaminq_f16, compiled with the
         * target features "neon,faminmax". Takes two float16x8_t operands and
         * returns a float16x8_t. Little-endian build: both operands are cast to
         * int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 40 is an opaque selector for the builtin,
         * presumably a type code for float16x8_t -- confirm. */
  43317 __ai __attribute__((target("neon,faminmax"))) float16x8_t vaminq_f16(float16x8_t __p0, float16x8_t __p1) {
  43318   float16x8_t __ret;
  43319   __ret = (float16x8_t) __builtin_neon_vaminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  43320   return __ret;
  43321 }
  43322 #else
        /* Big-endian build of vaminq_f16: reverses the 8 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43323 __ai __attribute__((target("neon,faminmax"))) float16x8_t vaminq_f16(float16x8_t __p0, float16x8_t __p1) {
  43324   float16x8_t __ret;
  43325   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  43326   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  43327   __ret = (float16x8_t) __builtin_neon_vaminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  43328   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  43329   return __ret;
  43330 }
  43331 #endif
  43332 
  43333 #ifdef __LITTLE_ENDIAN__
        /* vamin_f32: wrapper around __builtin_neon_vamin_f32, compiled with the
         * target features "neon,faminmax". Takes two float32x2_t operands and
         * returns a float32x2_t. Little-endian build: both operands are cast to
         * int8x8_t and forwarded unchanged.
         * NOTE(review): the literal 9 is an opaque selector for the builtin,
         * presumably a type code for float32x2_t -- confirm. */
  43334 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamin_f32(float32x2_t __p0, float32x2_t __p1) {
  43335   float32x2_t __ret;
  43336   __ret = (float32x2_t) __builtin_neon_vamin_f32((int8x8_t)__p0, (int8x8_t)__p1, 9);
  43337   return __ret;
  43338 }
  43339 #else
        /* Big-endian build of vamin_f32: reverses the 2 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43340 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamin_f32(float32x2_t __p0, float32x2_t __p1) {
  43341   float32x2_t __ret;
  43342   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43343   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  43344   __ret = (float32x2_t) __builtin_neon_vamin_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  43345   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43346   return __ret;
  43347 }
  43348 #endif
  43349 
  43350 #ifdef __LITTLE_ENDIAN__
        /* vamin_f16: wrapper around __builtin_neon_vamin_f16, compiled with the
         * target features "neon,faminmax". Takes two float16x4_t operands and
         * returns a float16x4_t. Little-endian build: both operands are cast to
         * int8x8_t and forwarded unchanged.
         * NOTE(review): the literal 8 is an opaque selector for the builtin,
         * presumably a type code for float16x4_t -- confirm. */
  43351 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamin_f16(float16x4_t __p0, float16x4_t __p1) {
  43352   float16x4_t __ret;
  43353   __ret = (float16x4_t) __builtin_neon_vamin_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  43354   return __ret;
  43355 }
  43356 #else
        /* Big-endian build of vamin_f16: reverses the 4 lanes of each operand
         * with __builtin_shufflevector, calls the builtin, then reverses the
         * result lanes before returning. */
  43357 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamin_f16(float16x4_t __p0, float16x4_t __p1) {
  43358   float16x4_t __ret;
  43359   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43360   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43361   __ret = (float16x4_t) __builtin_neon_vamin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  43362   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43363   return __ret;
  43364 }
  43365 #endif
  43366 
  43367 #endif
  43368 #if defined(__aarch64__) || defined(__arm64ec__)
  43369 __ai __attribute__((target("aes,neon"))) poly128_t vmull_p64(poly64_t __p0, poly64_t __p1) {
          /* Forwards the two poly64_t scalars to __builtin_neon_vmull_p64 and
           * returns the builtin's result cast to poly128_t. Compiled with the
           * target features "aes,neon". The operands are scalars, so this
           * function has a single definition with no endian-specific variant. */
  43370   poly128_t __ret;
  43371   __ret = (poly128_t) __builtin_neon_vmull_p64(__p0, __p1);
  43372   return __ret;
  43373 }
  43374 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_bf16(__p0, __p1, __p2, __p3): statement-expression macro
         * that yields a bfloat16x8_t. __p0 (bfloat16x8_t) and __p2 (bfloat16x4_t)
         * are each copied once into typed locals. Little-endian build: calls
         * vget_lane_bf16(__s2, __p3) and passes its result, together with __s0
         * and __p1, to vsetq_lane_bf16.
         * NOTE(review): the _230 suffix on every identifier presumably keeps
         * these names distinct from those used inside the nested get/set
         * helpers -- confirm against the generator. */
  43375 #define vcopyq_lane_bf16(__p0_230, __p1_230, __p2_230, __p3_230) __extension__ ({ \
  43376   bfloat16x8_t __ret_230; \
  43377   bfloat16x8_t __s0_230 = __p0_230; \
  43378   bfloat16x4_t __s2_230 = __p2_230; \
  43379   __ret_230 = vsetq_lane_bf16(vget_lane_bf16(__s2_230, __p3_230), __s0_230, __p1_230); \
  43380   __ret_230; \
  43381 })
  43382 #else
        /* Big-endian build of vcopyq_lane_bf16: reverses the 8 lanes of __s0 and
         * the 4 lanes of __s2 with __builtin_shufflevector, performs the get/set
         * through the __noswap_ helpers (presumably variants that do no lane
         * reversal of their own -- confirm), then reverses the 8 result lanes. */
  43383 #define vcopyq_lane_bf16(__p0_231, __p1_231, __p2_231, __p3_231) __extension__ ({ \
  43384   bfloat16x8_t __ret_231; \
  43385   bfloat16x8_t __s0_231 = __p0_231; \
  43386   bfloat16x4_t __s2_231 = __p2_231; \
  43387   bfloat16x8_t __rev0_231;  __rev0_231 = __builtin_shufflevector(__s0_231, __s0_231, 7, 6, 5, 4, 3, 2, 1, 0); \
  43388   bfloat16x4_t __rev2_231;  __rev2_231 = __builtin_shufflevector(__s2_231, __s2_231, 3, 2, 1, 0); \
  43389   __ret_231 = __noswap_vsetq_lane_bf16(__noswap_vget_lane_bf16(__rev2_231, __p3_231), __rev0_231, __p1_231); \
  43390   __ret_231 = __builtin_shufflevector(__ret_231, __ret_231, 7, 6, 5, 4, 3, 2, 1, 0); \
  43391   __ret_231; \
  43392 })
  43393 #endif
  43394 
  43395 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_bf16(__p0, __p1, __p2, __p3): statement-expression macro
         * that yields a bfloat16x4_t. __p0 and __p2 (both bfloat16x4_t) are each
         * copied once into typed locals. Little-endian build: calls
         * vget_lane_bf16(__s2, __p3) and passes its result, together with __s0
         * and __p1, to vset_lane_bf16.
         * NOTE(review): the _232 suffix on every identifier presumably keeps
         * these names distinct from those used inside the nested get/set
         * helpers -- confirm against the generator. */
  43396 #define vcopy_lane_bf16(__p0_232, __p1_232, __p2_232, __p3_232) __extension__ ({ \
  43397   bfloat16x4_t __ret_232; \
  43398   bfloat16x4_t __s0_232 = __p0_232; \
  43399   bfloat16x4_t __s2_232 = __p2_232; \
  43400   __ret_232 = vset_lane_bf16(vget_lane_bf16(__s2_232, __p3_232), __s0_232, __p1_232); \
  43401   __ret_232; \
  43402 })
  43403 #else
        /* Big-endian build of vcopy_lane_bf16: reverses the 4 lanes of __s0 and
         * of __s2 with __builtin_shufflevector, performs the get/set through the
         * __noswap_ helpers (presumably variants that do no lane reversal of
         * their own -- confirm), then reverses the 4 result lanes. */
  43404 #define vcopy_lane_bf16(__p0_233, __p1_233, __p2_233, __p3_233) __extension__ ({ \
  43405   bfloat16x4_t __ret_233; \
  43406   bfloat16x4_t __s0_233 = __p0_233; \
  43407   bfloat16x4_t __s2_233 = __p2_233; \
  43408   bfloat16x4_t __rev0_233;  __rev0_233 = __builtin_shufflevector(__s0_233, __s0_233, 3, 2, 1, 0); \
  43409   bfloat16x4_t __rev2_233;  __rev2_233 = __builtin_shufflevector(__s2_233, __s2_233, 3, 2, 1, 0); \
  43410   __ret_233 = __noswap_vset_lane_bf16(__noswap_vget_lane_bf16(__rev2_233, __p3_233), __rev0_233, __p1_233); \
  43411   __ret_233 = __builtin_shufflevector(__ret_233, __ret_233, 3, 2, 1, 0); \
  43412   __ret_233; \
  43413 })
  43414 #endif
  43415 
  43416 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_bf16(__p0, __p1, __p2, __p3): statement-expression macro
         * that yields a bfloat16x8_t. __p0 and __p2 (both bfloat16x8_t) are each
         * copied once into typed locals. Little-endian build: calls
         * vgetq_lane_bf16(__s2, __p3) and passes its result, together with __s0
         * and __p1, to vsetq_lane_bf16.
         * NOTE(review): the _234 suffix on every identifier presumably keeps
         * these names distinct from those used inside the nested get/set
         * helpers -- confirm against the generator. */
  43417 #define vcopyq_laneq_bf16(__p0_234, __p1_234, __p2_234, __p3_234) __extension__ ({ \
  43418   bfloat16x8_t __ret_234; \
  43419   bfloat16x8_t __s0_234 = __p0_234; \
  43420   bfloat16x8_t __s2_234 = __p2_234; \
  43421   __ret_234 = vsetq_lane_bf16(vgetq_lane_bf16(__s2_234, __p3_234), __s0_234, __p1_234); \
  43422   __ret_234; \
  43423 })
  43424 #else
        /* Big-endian build of vcopyq_laneq_bf16: reverses the 8 lanes of __s0 and
         * of __s2 with __builtin_shufflevector, performs the get/set through the
         * __noswap_ helpers (presumably variants that do no lane reversal of
         * their own -- confirm), then reverses the 8 result lanes. */
  43425 #define vcopyq_laneq_bf16(__p0_235, __p1_235, __p2_235, __p3_235) __extension__ ({ \
  43426   bfloat16x8_t __ret_235; \
  43427   bfloat16x8_t __s0_235 = __p0_235; \
  43428   bfloat16x8_t __s2_235 = __p2_235; \
  43429   bfloat16x8_t __rev0_235;  __rev0_235 = __builtin_shufflevector(__s0_235, __s0_235, 7, 6, 5, 4, 3, 2, 1, 0); \
  43430   bfloat16x8_t __rev2_235;  __rev2_235 = __builtin_shufflevector(__s2_235, __s2_235, 7, 6, 5, 4, 3, 2, 1, 0); \
  43431   __ret_235 = __noswap_vsetq_lane_bf16(__noswap_vgetq_lane_bf16(__rev2_235, __p3_235), __rev0_235, __p1_235); \
  43432   __ret_235 = __builtin_shufflevector(__ret_235, __ret_235, 7, 6, 5, 4, 3, 2, 1, 0); \
  43433   __ret_235; \
  43434 })
  43435 #endif
  43436 
  43437 #ifdef __LITTLE_ENDIAN__
        /* vcopy_laneq_bf16(__p0, __p1, __p2, __p3): statement-expression macro
         * that yields a bfloat16x4_t. __p0 (bfloat16x4_t) and __p2 (bfloat16x8_t)
         * are each copied once into typed locals. Little-endian build: calls
         * vgetq_lane_bf16(__s2, __p3) and passes its result, together with __s0
         * and __p1, to vset_lane_bf16.
         * NOTE(review): the _236 suffix on every identifier presumably keeps
         * these names distinct from those used inside the nested get/set
         * helpers -- confirm against the generator. */
  43438 #define vcopy_laneq_bf16(__p0_236, __p1_236, __p2_236, __p3_236) __extension__ ({ \
  43439   bfloat16x4_t __ret_236; \
  43440   bfloat16x4_t __s0_236 = __p0_236; \
  43441   bfloat16x8_t __s2_236 = __p2_236; \
  43442   __ret_236 = vset_lane_bf16(vgetq_lane_bf16(__s2_236, __p3_236), __s0_236, __p1_236); \
  43443   __ret_236; \
  43444 })
  43445 #else
        /* Big-endian build of vcopy_laneq_bf16: reverses the 4 lanes of __s0 and
         * the 8 lanes of __s2 with __builtin_shufflevector, performs the get/set
         * through the __noswap_ helpers (presumably variants that do no lane
         * reversal of their own -- confirm), then reverses the 4 result lanes. */
  43446 #define vcopy_laneq_bf16(__p0_237, __p1_237, __p2_237, __p3_237) __extension__ ({ \
  43447   bfloat16x4_t __ret_237; \
  43448   bfloat16x4_t __s0_237 = __p0_237; \
  43449   bfloat16x8_t __s2_237 = __p2_237; \
  43450   bfloat16x4_t __rev0_237;  __rev0_237 = __builtin_shufflevector(__s0_237, __s0_237, 3, 2, 1, 0); \
  43451   bfloat16x8_t __rev2_237;  __rev2_237 = __builtin_shufflevector(__s2_237, __s2_237, 7, 6, 5, 4, 3, 2, 1, 0); \
  43452   __ret_237 = __noswap_vset_lane_bf16(__noswap_vgetq_lane_bf16(__rev2_237, __p3_237), __rev0_237, __p1_237); \
  43453   __ret_237 = __builtin_shufflevector(__ret_237, __ret_237, 3, 2, 1, 0); \
  43454   __ret_237; \
  43455 })
  43456 #endif
  43457 
  43458 #ifdef __LITTLE_ENDIAN__
        /* vcvt_bf16_f32: wrapper around __builtin_neon_vcvt_bf16_f32, compiled
         * with the target features "bf16,neon". Takes a float32x4_t and returns a
         * bfloat16x4_t. Little-endian build: the operand is cast to int8x16_t and
         * forwarded unchanged.
         * NOTE(review): the literal 11 is an opaque selector for the builtin,
         * presumably a type code for bfloat16x4_t -- confirm. */
  43459 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) {
  43460   bfloat16x4_t __ret;
  43461   __ret = (bfloat16x4_t) __builtin_neon_vcvt_bf16_f32((int8x16_t)__p0, 11);
  43462   return __ret;
  43463 }
  43464 #else
        /* Big-endian build of vcvt_bf16_f32: reverses the 4 input lanes with
         * __builtin_shufflevector, calls the builtin, then reverses the 4 result
         * lanes before returning. */
  43465 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) {
  43466   bfloat16x4_t __ret;
  43467   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43468   __ret = (bfloat16x4_t) __builtin_neon_vcvt_bf16_f32((int8x16_t)__rev0, 11);
  43469   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43470   return __ret;
  43471 }
  43472 #endif
  43473 
  43474 #ifdef __LITTLE_ENDIAN__
        /* vcvtq_high_bf16_f32: wrapper around __builtin_neon_vcvtq_high_bf16_f32,
         * compiled with the target features "bf16,neon". Takes a bfloat16x8_t and
         * a float32x4_t and returns a bfloat16x8_t. Little-endian build: both
         * operands are cast to int8x16_t and forwarded unchanged.
         * NOTE(review): the literal 43 is an opaque selector for the builtin,
         * presumably a type code for bfloat16x8_t -- confirm. */
  43475 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) {
  43476   bfloat16x8_t __ret;
  43477   __ret = (bfloat16x8_t) __builtin_neon_vcvtq_high_bf16_f32((int8x16_t)__p0, (int8x16_t)__p1, 43);
  43478   return __ret;
  43479 }
  43480 #else
        /* Big-endian build of vcvtq_high_bf16_f32: reverses the 8 lanes of __p0
         * and the 4 lanes of __p1 with __builtin_shufflevector, calls the
         * builtin, then reverses the 8 result lanes before returning. */
  43481 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) {
  43482   bfloat16x8_t __ret;
  43483   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  43484   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43485   __ret = (bfloat16x8_t) __builtin_neon_vcvtq_high_bf16_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 43);
  43486   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  43487   return __ret;
  43488 }
  43489 #endif
  43490 
  43491 #ifdef __LITTLE_ENDIAN__
  43492 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) {
  43493   bfloat16x8_t __ret;
  43494   __ret = (bfloat16x8_t) __builtin_neon_vcvtq_low_bf16_f32((int8x16_t)__p0, 43);
  43495   return __ret;
  43496 }
  43497 #else
  43498 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) {
  43499   bfloat16x8_t __ret;
  43500   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43501   __ret = (bfloat16x8_t) __builtin_neon_vcvtq_low_bf16_f32((int8x16_t)__rev0, 43);
  43502   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  43503   return __ret;
  43504 }
  43505 #endif
  43506 
  43507 __ai __attribute__((target("bf16,neon"))) poly8x8_t vreinterpret_p8_bf16(bfloat16x4_t __p0) {
  43508   poly8x8_t __ret;
  43509   __ret = (poly8x8_t)(__p0);
  43510   return __ret;
  43511 }
  43512 __ai __attribute__((target("bf16,neon"))) poly64x1_t vreinterpret_p64_bf16(bfloat16x4_t __p0) {
  43513   poly64x1_t __ret;
  43514   __ret = (poly64x1_t)(__p0);
  43515   return __ret;
  43516 }
  43517 __ai __attribute__((target("bf16,neon"))) poly16x4_t vreinterpret_p16_bf16(bfloat16x4_t __p0) {
  43518   poly16x4_t __ret;
  43519   __ret = (poly16x4_t)(__p0);
  43520   return __ret;
  43521 }
  43522 __ai __attribute__((target("bf16,neon"))) poly8x16_t vreinterpretq_p8_bf16(bfloat16x8_t __p0) {
  43523   poly8x16_t __ret;
  43524   __ret = (poly8x16_t)(__p0);
  43525   return __ret;
  43526 }
  43527 __ai __attribute__((target("bf16,neon"))) poly128_t vreinterpretq_p128_bf16(bfloat16x8_t __p0) {
  43528   poly128_t __ret;
  43529   __ret = (poly128_t)(__p0);
  43530   return __ret;
  43531 }
  43532 __ai __attribute__((target("bf16,neon"))) poly64x2_t vreinterpretq_p64_bf16(bfloat16x8_t __p0) {
  43533   poly64x2_t __ret;
  43534   __ret = (poly64x2_t)(__p0);
  43535   return __ret;
  43536 }
  43537 __ai __attribute__((target("bf16,neon"))) poly16x8_t vreinterpretq_p16_bf16(bfloat16x8_t __p0) {
  43538   poly16x8_t __ret;
  43539   __ret = (poly16x8_t)(__p0);
  43540   return __ret;
  43541 }
  43542 __ai __attribute__((target("bf16,neon"))) uint8x16_t vreinterpretq_u8_bf16(bfloat16x8_t __p0) {
  43543   uint8x16_t __ret;
  43544   __ret = (uint8x16_t)(__p0);
  43545   return __ret;
  43546 }
  43547 __ai __attribute__((target("bf16,neon"))) uint32x4_t vreinterpretq_u32_bf16(bfloat16x8_t __p0) {
  43548   uint32x4_t __ret;
  43549   __ret = (uint32x4_t)(__p0);
  43550   return __ret;
  43551 }
  43552 __ai __attribute__((target("bf16,neon"))) uint64x2_t vreinterpretq_u64_bf16(bfloat16x8_t __p0) {
  43553   uint64x2_t __ret;
  43554   __ret = (uint64x2_t)(__p0);
  43555   return __ret;
  43556 }
  43557 __ai __attribute__((target("bf16,neon"))) uint16x8_t vreinterpretq_u16_bf16(bfloat16x8_t __p0) {
  43558   uint16x8_t __ret;
  43559   __ret = (uint16x8_t)(__p0);
  43560   return __ret;
  43561 }
  43562 __ai __attribute__((target("bf16,neon"))) int8x16_t vreinterpretq_s8_bf16(bfloat16x8_t __p0) {
  43563   int8x16_t __ret;
  43564   __ret = (int8x16_t)(__p0);
  43565   return __ret;
  43566 }
  43567 __ai __attribute__((target("bf16,neon"))) float64x2_t vreinterpretq_f64_bf16(bfloat16x8_t __p0) {
  43568   float64x2_t __ret;
  43569   __ret = (float64x2_t)(__p0);
  43570   return __ret;
  43571 }
  43572 __ai __attribute__((target("bf16,neon"))) float32x4_t vreinterpretq_f32_bf16(bfloat16x8_t __p0) {
  43573   float32x4_t __ret;
  43574   __ret = (float32x4_t)(__p0);
  43575   return __ret;
  43576 }
  43577 __ai __attribute__((target("bf16,neon"))) float16x8_t vreinterpretq_f16_bf16(bfloat16x8_t __p0) {
  43578   float16x8_t __ret;
  43579   __ret = (float16x8_t)(__p0);
  43580   return __ret;
  43581 }
  43582 __ai __attribute__((target("bf16,neon"))) int32x4_t vreinterpretq_s32_bf16(bfloat16x8_t __p0) {
  43583   int32x4_t __ret;
  43584   __ret = (int32x4_t)(__p0);
  43585   return __ret;
  43586 }
  43587 __ai __attribute__((target("bf16,neon"))) int64x2_t vreinterpretq_s64_bf16(bfloat16x8_t __p0) {
  43588   int64x2_t __ret;
  43589   __ret = (int64x2_t)(__p0);
  43590   return __ret;
  43591 }
  43592 __ai __attribute__((target("bf16,neon"))) int16x8_t vreinterpretq_s16_bf16(bfloat16x8_t __p0) {
  43593   int16x8_t __ret;
  43594   __ret = (int16x8_t)(__p0);
  43595   return __ret;
  43596 }
  43597 __ai __attribute__((target("bf16,neon"))) uint8x8_t vreinterpret_u8_bf16(bfloat16x4_t __p0) {
  43598   uint8x8_t __ret;
  43599   __ret = (uint8x8_t)(__p0);
  43600   return __ret;
  43601 }
  43602 __ai __attribute__((target("bf16,neon"))) uint32x2_t vreinterpret_u32_bf16(bfloat16x4_t __p0) {
  43603   uint32x2_t __ret;
  43604   __ret = (uint32x2_t)(__p0);
  43605   return __ret;
  43606 }
  43607 __ai __attribute__((target("bf16,neon"))) uint64x1_t vreinterpret_u64_bf16(bfloat16x4_t __p0) {
  43608   uint64x1_t __ret;
  43609   __ret = (uint64x1_t)(__p0);
  43610   return __ret;
  43611 }
  43612 __ai __attribute__((target("bf16,neon"))) uint16x4_t vreinterpret_u16_bf16(bfloat16x4_t __p0) {
  43613   uint16x4_t __ret;
  43614   __ret = (uint16x4_t)(__p0);
  43615   return __ret;
  43616 }
  43617 __ai __attribute__((target("bf16,neon"))) int8x8_t vreinterpret_s8_bf16(bfloat16x4_t __p0) {
  43618   int8x8_t __ret;
  43619   __ret = (int8x8_t)(__p0);
  43620   return __ret;
  43621 }
  43622 __ai __attribute__((target("bf16,neon"))) float64x1_t vreinterpret_f64_bf16(bfloat16x4_t __p0) {
  43623   float64x1_t __ret;
  43624   __ret = (float64x1_t)(__p0);
  43625   return __ret;
  43626 }
  43627 __ai __attribute__((target("bf16,neon"))) float32x2_t vreinterpret_f32_bf16(bfloat16x4_t __p0) {
  43628   float32x2_t __ret;
  43629   __ret = (float32x2_t)(__p0);
  43630   return __ret;
  43631 }
  43632 __ai __attribute__((target("bf16,neon"))) float16x4_t vreinterpret_f16_bf16(bfloat16x4_t __p0) {
  43633   float16x4_t __ret;
  43634   __ret = (float16x4_t)(__p0);
  43635   return __ret;
  43636 }
  43637 __ai __attribute__((target("bf16,neon"))) int32x2_t vreinterpret_s32_bf16(bfloat16x4_t __p0) {
  43638   int32x2_t __ret;
  43639   __ret = (int32x2_t)(__p0);
  43640   return __ret;
  43641 }
  43642 __ai __attribute__((target("bf16,neon"))) int64x1_t vreinterpret_s64_bf16(bfloat16x4_t __p0) {
  43643   int64x1_t __ret;
  43644   __ret = (int64x1_t)(__p0);
  43645   return __ret;
  43646 }
  43647 __ai __attribute__((target("bf16,neon"))) int16x4_t vreinterpret_s16_bf16(bfloat16x4_t __p0) {
  43648   int16x4_t __ret;
  43649   __ret = (int16x4_t)(__p0);
  43650   return __ret;
  43651 }
  43652 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p8(poly8x16_t __p0) {
  43653   bfloat16x8_t __ret;
  43654   __ret = (bfloat16x8_t)(__p0);
  43655   return __ret;
  43656 }
  43657 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p128(poly128_t __p0) {
  43658   bfloat16x8_t __ret;
  43659   __ret = (bfloat16x8_t)(__p0);
  43660   return __ret;
  43661 }
  43662 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p64(poly64x2_t __p0) {
  43663   bfloat16x8_t __ret;
  43664   __ret = (bfloat16x8_t)(__p0);
  43665   return __ret;
  43666 }
  43667 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p16(poly16x8_t __p0) {
  43668   bfloat16x8_t __ret;
  43669   __ret = (bfloat16x8_t)(__p0);
  43670   return __ret;
  43671 }
  43672 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u8(uint8x16_t __p0) {
  43673   bfloat16x8_t __ret;
  43674   __ret = (bfloat16x8_t)(__p0);
  43675   return __ret;
  43676 }
  43677 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u32(uint32x4_t __p0) {
  43678   bfloat16x8_t __ret;
  43679   __ret = (bfloat16x8_t)(__p0);
  43680   return __ret;
  43681 }
  43682 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u64(uint64x2_t __p0) {
  43683   bfloat16x8_t __ret;
  43684   __ret = (bfloat16x8_t)(__p0);
  43685   return __ret;
  43686 }
  43687 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u16(uint16x8_t __p0) {
  43688   bfloat16x8_t __ret;
  43689   __ret = (bfloat16x8_t)(__p0);
  43690   return __ret;
  43691 }
  43692 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s8(int8x16_t __p0) {
  43693   bfloat16x8_t __ret;
  43694   __ret = (bfloat16x8_t)(__p0);
  43695   return __ret;
  43696 }
  43697 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f64(float64x2_t __p0) {
  43698   bfloat16x8_t __ret;
  43699   __ret = (bfloat16x8_t)(__p0);
  43700   return __ret;
  43701 }
  43702 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f32(float32x4_t __p0) {
  43703   bfloat16x8_t __ret;
  43704   __ret = (bfloat16x8_t)(__p0);
  43705   return __ret;
  43706 }
  43707 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f16(float16x8_t __p0) {
  43708   bfloat16x8_t __ret;
  43709   __ret = (bfloat16x8_t)(__p0);
  43710   return __ret;
  43711 }
  43712 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s32(int32x4_t __p0) {
  43713   bfloat16x8_t __ret;
  43714   __ret = (bfloat16x8_t)(__p0);
  43715   return __ret;
  43716 }
  43717 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s64(int64x2_t __p0) {
  43718   bfloat16x8_t __ret;
  43719   __ret = (bfloat16x8_t)(__p0);
  43720   return __ret;
  43721 }
  43722 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s16(int16x8_t __p0) {
  43723   bfloat16x8_t __ret;
  43724   __ret = (bfloat16x8_t)(__p0);
  43725   return __ret;
  43726 }
  43727 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p8(poly8x8_t __p0) {
  43728   bfloat16x4_t __ret;
  43729   __ret = (bfloat16x4_t)(__p0);
  43730   return __ret;
  43731 }
  43732 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p64(poly64x1_t __p0) {
  43733   bfloat16x4_t __ret;
  43734   __ret = (bfloat16x4_t)(__p0);
  43735   return __ret;
  43736 }
  43737 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p16(poly16x4_t __p0) {
  43738   bfloat16x4_t __ret;
  43739   __ret = (bfloat16x4_t)(__p0);
  43740   return __ret;
  43741 }
  43742 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u8(uint8x8_t __p0) {
  43743   bfloat16x4_t __ret;
  43744   __ret = (bfloat16x4_t)(__p0);
  43745   return __ret;
  43746 }
  43747 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u32(uint32x2_t __p0) {
  43748   bfloat16x4_t __ret;
  43749   __ret = (bfloat16x4_t)(__p0);
  43750   return __ret;
  43751 }
  43752 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u64(uint64x1_t __p0) {
  43753   bfloat16x4_t __ret;
  43754   __ret = (bfloat16x4_t)(__p0);
  43755   return __ret;
  43756 }
  43757 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u16(uint16x4_t __p0) {
  43758   bfloat16x4_t __ret;
  43759   __ret = (bfloat16x4_t)(__p0);
  43760   return __ret;
  43761 }
  43762 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s8(int8x8_t __p0) {
  43763   bfloat16x4_t __ret;
  43764   __ret = (bfloat16x4_t)(__p0);
  43765   return __ret;
  43766 }
  43767 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f64(float64x1_t __p0) {
  43768   bfloat16x4_t __ret;
  43769   __ret = (bfloat16x4_t)(__p0);
  43770   return __ret;
  43771 }
  43772 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f32(float32x2_t __p0) {
  43773   bfloat16x4_t __ret;
  43774   __ret = (bfloat16x4_t)(__p0);
  43775   return __ret;
  43776 }
  43777 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f16(float16x4_t __p0) {
  43778   bfloat16x4_t __ret;
  43779   __ret = (bfloat16x4_t)(__p0);
  43780   return __ret;
  43781 }
  43782 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s32(int32x2_t __p0) {
  43783   bfloat16x4_t __ret;
  43784   __ret = (bfloat16x4_t)(__p0);
  43785   return __ret;
  43786 }
  43787 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s64(int64x1_t __p0) {
  43788   bfloat16x4_t __ret;
  43789   __ret = (bfloat16x4_t)(__p0);
  43790   return __ret;
  43791 }
  43792 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s16(int16x4_t __p0) {
  43793   bfloat16x4_t __ret;
  43794   __ret = (bfloat16x4_t)(__p0);
  43795   return __ret;
  43796 }
  43797 #ifdef __LITTLE_ENDIAN__
  43798 #define vdotq_laneq_u32(__p0_238, __p1_238, __p2_238, __p3_238) __extension__ ({ \
  43799   uint32x4_t __ret_238; \
  43800   uint32x4_t __s0_238 = __p0_238; \
  43801   uint8x16_t __s1_238 = __p1_238; \
  43802   uint8x16_t __s2_238 = __p2_238; \
  43803   __ret_238 = vdotq_u32(__s0_238, __s1_238, __builtin_bit_cast(uint8x16_t, splatq_laneq_u32(__builtin_bit_cast(uint32x4_t, __s2_238), __p3_238))); \
  43804   __ret_238; \
  43805 })
  43806 #else
  43807 #define vdotq_laneq_u32(__p0_239, __p1_239, __p2_239, __p3_239) __extension__ ({ \
  43808   uint32x4_t __ret_239; \
  43809   uint32x4_t __s0_239 = __p0_239; \
  43810   uint8x16_t __s1_239 = __p1_239; \
  43811   uint8x16_t __s2_239 = __p2_239; \
  43812   uint32x4_t __rev0_239;  __rev0_239 = __builtin_shufflevector(__s0_239, __s0_239, 3, 2, 1, 0); \
  43813   uint8x16_t __rev1_239;  __rev1_239 = __builtin_shufflevector(__s1_239, __s1_239, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43814   uint8x16_t __rev2_239;  __rev2_239 = __builtin_shufflevector(__s2_239, __s2_239, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43815   __ret_239 = __noswap_vdotq_u32(__rev0_239, __rev1_239, __builtin_bit_cast(uint8x16_t, __noswap_splatq_laneq_u32(__builtin_bit_cast(uint32x4_t, __rev2_239), __p3_239))); \
  43816   __ret_239 = __builtin_shufflevector(__ret_239, __ret_239, 3, 2, 1, 0); \
  43817   __ret_239; \
  43818 })
  43819 #endif
  43820 
  43821 #ifdef __LITTLE_ENDIAN__
  43822 #define vdotq_laneq_s32(__p0_240, __p1_240, __p2_240, __p3_240) __extension__ ({ \
  43823   int32x4_t __ret_240; \
  43824   int32x4_t __s0_240 = __p0_240; \
  43825   int8x16_t __s1_240 = __p1_240; \
  43826   int8x16_t __s2_240 = __p2_240; \
  43827   __ret_240 = vdotq_s32(__s0_240, __s1_240, __builtin_bit_cast(int8x16_t, splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_240), __p3_240))); \
  43828   __ret_240; \
  43829 })
  43830 #else
  43831 #define vdotq_laneq_s32(__p0_241, __p1_241, __p2_241, __p3_241) __extension__ ({ \
  43832   int32x4_t __ret_241; \
  43833   int32x4_t __s0_241 = __p0_241; \
  43834   int8x16_t __s1_241 = __p1_241; \
  43835   int8x16_t __s2_241 = __p2_241; \
  43836   int32x4_t __rev0_241;  __rev0_241 = __builtin_shufflevector(__s0_241, __s0_241, 3, 2, 1, 0); \
  43837   int8x16_t __rev1_241;  __rev1_241 = __builtin_shufflevector(__s1_241, __s1_241, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43838   int8x16_t __rev2_241;  __rev2_241 = __builtin_shufflevector(__s2_241, __s2_241, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43839   __ret_241 = __noswap_vdotq_s32(__rev0_241, __rev1_241, __builtin_bit_cast(int8x16_t, __noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_241), __p3_241))); \
  43840   __ret_241 = __builtin_shufflevector(__ret_241, __ret_241, 3, 2, 1, 0); \
  43841   __ret_241; \
  43842 })
  43843 #endif
  43844 
  43845 #ifdef __LITTLE_ENDIAN__
  43846 #define vdot_laneq_u32(__p0_242, __p1_242, __p2_242, __p3_242) __extension__ ({ \
  43847   uint32x2_t __ret_242; \
  43848   uint32x2_t __s0_242 = __p0_242; \
  43849   uint8x8_t __s1_242 = __p1_242; \
  43850   uint8x16_t __s2_242 = __p2_242; \
  43851   __ret_242 = vdot_u32(__s0_242, __s1_242, __builtin_bit_cast(uint8x8_t, splat_laneq_u32(__builtin_bit_cast(uint32x4_t, __s2_242), __p3_242))); \
  43852   __ret_242; \
  43853 })
  43854 #else
  43855 #define vdot_laneq_u32(__p0_243, __p1_243, __p2_243, __p3_243) __extension__ ({ \
  43856   uint32x2_t __ret_243; \
  43857   uint32x2_t __s0_243 = __p0_243; \
  43858   uint8x8_t __s1_243 = __p1_243; \
  43859   uint8x16_t __s2_243 = __p2_243; \
  43860   uint32x2_t __rev0_243;  __rev0_243 = __builtin_shufflevector(__s0_243, __s0_243, 1, 0); \
  43861   uint8x8_t __rev1_243;  __rev1_243 = __builtin_shufflevector(__s1_243, __s1_243, 7, 6, 5, 4, 3, 2, 1, 0); \
  43862   uint8x16_t __rev2_243;  __rev2_243 = __builtin_shufflevector(__s2_243, __s2_243, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43863   __ret_243 = __noswap_vdot_u32(__rev0_243, __rev1_243, __builtin_bit_cast(uint8x8_t, __noswap_splat_laneq_u32(__builtin_bit_cast(uint32x4_t, __rev2_243), __p3_243))); \
  43864   __ret_243 = __builtin_shufflevector(__ret_243, __ret_243, 1, 0); \
  43865   __ret_243; \
  43866 })
  43867 #endif
  43868 
  43869 #ifdef __LITTLE_ENDIAN__
  43870 #define vdot_laneq_s32(__p0_244, __p1_244, __p2_244, __p3_244) __extension__ ({ \
  43871   int32x2_t __ret_244; \
  43872   int32x2_t __s0_244 = __p0_244; \
  43873   int8x8_t __s1_244 = __p1_244; \
  43874   int8x16_t __s2_244 = __p2_244; \
  43875   __ret_244 = vdot_s32(__s0_244, __s1_244, __builtin_bit_cast(int8x8_t, splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_244), __p3_244))); \
  43876   __ret_244; \
  43877 })
  43878 #else
  43879 #define vdot_laneq_s32(__p0_245, __p1_245, __p2_245, __p3_245) __extension__ ({ \
  43880   int32x2_t __ret_245; \
  43881   int32x2_t __s0_245 = __p0_245; \
  43882   int8x8_t __s1_245 = __p1_245; \
  43883   int8x16_t __s2_245 = __p2_245; \
  43884   int32x2_t __rev0_245;  __rev0_245 = __builtin_shufflevector(__s0_245, __s0_245, 1, 0); \
  43885   int8x8_t __rev1_245;  __rev1_245 = __builtin_shufflevector(__s1_245, __s1_245, 7, 6, 5, 4, 3, 2, 1, 0); \
  43886   int8x16_t __rev2_245;  __rev2_245 = __builtin_shufflevector(__s2_245, __s2_245, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  43887   __ret_245 = __noswap_vdot_s32(__rev0_245, __rev1_245, __builtin_bit_cast(int8x8_t, __noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_245), __p3_245))); \
  43888   __ret_245 = __builtin_shufflevector(__ret_245, __ret_245, 1, 0); \
  43889   __ret_245; \
  43890 })
  43891 #endif
  43892 
  43893 #ifdef __LITTLE_ENDIAN__
  43894 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43895   float32x4_t __ret;
  43896   __ret = (float32x4_t) __builtin_neon_vfmlalq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  43897   return __ret;
  43898 }
  43899 #else
  43900 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43901   float32x4_t __ret;
  43902   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43903   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  43904   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  43905   __ret = (float32x4_t) __builtin_neon_vfmlalq_high_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  43906   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43907   return __ret;
  43908 }
  43909 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43910   float32x4_t __ret;
  43911   __ret = (float32x4_t) __builtin_neon_vfmlalq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  43912   return __ret;
  43913 }
  43914 #endif
  43915 
  43916 #ifdef __LITTLE_ENDIAN__
  43917 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43918   float32x2_t __ret;
  43919   __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  43920   return __ret;
  43921 }
  43922 #else
  43923 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43924   float32x2_t __ret;
  43925   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43926   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43927   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  43928   __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  43929   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43930   return __ret;
  43931 }
  43932 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43933   float32x2_t __ret;
  43934   __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  43935   return __ret;
  43936 }
  43937 #endif
  43938 
  43939 #ifdef __LITTLE_ENDIAN__
  43940 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43941   float32x4_t __ret;
  43942   __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  43943   return __ret;
  43944 }
  43945 #else
  43946 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43947   float32x4_t __ret;
  43948   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43949   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  43950   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  43951   __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  43952   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43953   return __ret;
  43954 }
  43955 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43956   float32x4_t __ret;
  43957   __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  43958   return __ret;
  43959 }
  43960 #endif
  43961 
  43962 #ifdef __LITTLE_ENDIAN__
  43963 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43964   float32x2_t __ret;
  43965   __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  43966   return __ret;
  43967 }
  43968 #else
  43969 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43970   float32x2_t __ret;
  43971   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  43972   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  43973   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  43974   __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  43975   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  43976   return __ret;
  43977 }
  43978 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  43979   float32x2_t __ret;
  43980   __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  43981   return __ret;
  43982 }
  43983 #endif
  43984 
  43985 #ifdef __LITTLE_ENDIAN__
  43986 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43987   float32x4_t __ret;
  43988   __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  43989   return __ret;
  43990 }
  43991 #else
  43992 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  43993   float32x4_t __ret;
  43994   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  43995   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  43996   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  43997   __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  43998   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  43999   return __ret;
  44000 }
  44001 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  44002   float32x4_t __ret;
  44003   __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  44004   return __ret;
  44005 }
  44006 #endif
  44007 
  44008 #ifdef __LITTLE_ENDIAN__
  44009 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44010   float32x2_t __ret;
  44011   __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  44012   return __ret;
  44013 }
  44014 #else
  44015 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44016   float32x2_t __ret;
  44017   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  44018   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  44019   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  44020   __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  44021   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  44022   return __ret;
  44023 }
  44024 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44025   float32x2_t __ret;
  44026   __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  44027   return __ret;
  44028 }
  44029 #endif
  44030 
  44031 #ifdef __LITTLE_ENDIAN__
  44032 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  44033   float32x4_t __ret;
  44034   __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  44035   return __ret;
  44036 }
  44037 #else
  44038 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  44039   float32x4_t __ret;
  44040   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  44041   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44042   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  44043   __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41);
  44044   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  44045   return __ret;
  44046 }
  44047 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) {
  44048   float32x4_t __ret;
  44049   __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41);
  44050   return __ret;
  44051 }
  44052 #endif
  44053 
  44054 #ifdef __LITTLE_ENDIAN__
  44055 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44056   float32x2_t __ret;
  44057   __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  44058   return __ret;
  44059 }
  44060 #else
  44061 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44062   float32x2_t __ret;
  44063   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  44064   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  44065   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  44066   __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9);
  44067   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  44068   return __ret;
  44069 }
  44070 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) {
  44071   float32x2_t __ret;
  44072   __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9);
  44073   return __ret;
  44074 }
  44075 #endif
  44076 
  44077 #ifdef __LITTLE_ENDIAN__
  44078 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vdivq_f16(float16x8_t __p0, float16x8_t __p1) {
  44079   float16x8_t __ret;
  44080   __ret = __p0 / __p1;
  44081   return __ret;
  44082 }
  44083 #else
  44084 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vdivq_f16(float16x8_t __p0, float16x8_t __p1) {
  44085   float16x8_t __ret;
  44086   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44087   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44088   __ret = __rev0 / __rev1;
  44089   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44090   return __ret;
  44091 }
  44092 #endif
  44093 
  44094 #ifdef __LITTLE_ENDIAN__
  44095 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vdiv_f16(float16x4_t __p0, float16x4_t __p1) {
  44096   float16x4_t __ret;
  44097   __ret = __p0 / __p1;
  44098   return __ret;
  44099 }
  44100 #else
  44101 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vdiv_f16(float16x4_t __p0, float16x4_t __p1) {
  44102   float16x4_t __ret;
  44103   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  44104   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  44105   __ret = __rev0 / __rev1;
  44106   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  44107   return __ret;
  44108 }
  44109 #endif
  44110 
  /* vfmah_lane_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Copies the two float16_t scalars and the float16x4_t vector into typed
   * locals and forwards them, with __p3 passed through textually, to
   * __builtin_neon_vfmah_lane_f16; the float16_t result is the macro's value.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) first.
   * __noswap_vfmah_lane_f16 (defined only in the #else branch) skips that
   * reversal; vfmsh_lane_f16 in this file calls it with a vector it has
   * already reversed.
   * NOTE(review): __p3 is presumably a constant lane index - confirm. */
  44111 #ifdef __LITTLE_ENDIAN__
  44112 #define vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44113   float16_t __ret; \
  44114   float16_t __s0 = __p0; \
  44115   float16_t __s1 = __p1; \
  44116   float16x4_t __s2 = __p2; \
  44117   __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__s2, __p3); \
  44118   __ret; \
  44119 })
  44120 #else
  44121 #define vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44122   float16_t __ret; \
  44123   float16_t __s0 = __p0; \
  44124   float16_t __s1 = __p1; \
  44125   float16x4_t __s2 = __p2; \
  44126   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  44127   __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__rev2, __p3); \
  44128   __ret; \
  44129 })
  44130 #define __noswap_vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44131   float16_t __ret; \
  44132   float16_t __s0 = __p0; \
  44133   float16_t __s1 = __p1; \
  44134   float16x4_t __s2 = __p2; \
  44135   __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__s2, __p3); \
  44136   __ret; \
  44137 })
  44138 #endif
  44139 
  /* vfmaq_lane_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Copies two float16x8_t operands and one float16x4_t operand into typed
   * locals, casts them to int8x16_t/int8x8_t and forwards them, together
   * with __p3 (passed through textually) and the constant 40, to
   * __builtin_neon_vfmaq_lane_f16; the result is cast back to float16x8_t.
   * Without __LITTLE_ENDIAN__ every vector operand is lane-reversed before
   * the call and the result is reversed back. __noswap_vfmaq_lane_f16 omits
   * the reversals; vfmsq_lane_f16 uses it on operands it already reversed.
   * NOTE(review): 40 is presumably the builtin's vector type code - confirm. */
  44140 #ifdef __LITTLE_ENDIAN__
  44141 #define vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44142   float16x8_t __ret; \
  44143   float16x8_t __s0 = __p0; \
  44144   float16x8_t __s1 = __p1; \
  44145   float16x4_t __s2 = __p2; \
  44146   __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 40); \
  44147   __ret; \
  44148 })
  44149 #else
  44150 #define vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44151   float16x8_t __ret; \
  44152   float16x8_t __s0 = __p0; \
  44153   float16x8_t __s1 = __p1; \
  44154   float16x4_t __s2 = __p2; \
  44155   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44156   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  44157   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  44158   __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, __p3, 40); \
  44159   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  44160   __ret; \
  44161 })
  44162 #define __noswap_vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44163   float16x8_t __ret; \
  44164   float16x8_t __s0 = __p0; \
  44165   float16x8_t __s1 = __p1; \
  44166   float16x4_t __s2 = __p2; \
  44167   __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 40); \
  44168   __ret; \
  44169 })
  44170 #endif
  44171 
  /* vfma_lane_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Copies three float16x4_t operands into typed locals, casts them to
   * int8x8_t and forwards them, together with __p3 (passed through
   * textually) and the constant 8, to __builtin_neon_vfma_lane_f16; the
   * result is cast back to float16x4_t.
   * Without __LITTLE_ENDIAN__ every operand is lane-reversed (3,2,1,0)
   * before the call and the result is reversed back. __noswap_vfma_lane_f16
   * omits the reversals; vfms_lane_f16 uses it on already-reversed operands.
   * NOTE(review): 8 is presumably the builtin's vector type code - confirm. */
  44172 #ifdef __LITTLE_ENDIAN__
  44173 #define vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44174   float16x4_t __ret; \
  44175   float16x4_t __s0 = __p0; \
  44176   float16x4_t __s1 = __p1; \
  44177   float16x4_t __s2 = __p2; \
  44178   __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 8); \
  44179   __ret; \
  44180 })
  44181 #else
  44182 #define vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44183   float16x4_t __ret; \
  44184   float16x4_t __s0 = __p0; \
  44185   float16x4_t __s1 = __p1; \
  44186   float16x4_t __s2 = __p2; \
  44187   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44188   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  44189   float16x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  44190   __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, __p3, 8); \
  44191   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  44192   __ret; \
  44193 })
  44194 #define __noswap_vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44195   float16x4_t __ret; \
  44196   float16x4_t __s0 = __p0; \
  44197   float16x4_t __s1 = __p1; \
  44198   float16x4_t __s2 = __p2; \
  44199   __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 8); \
  44200   __ret; \
  44201 })
  44202 #endif
  44203 
  /* vfmah_laneq_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Same shape as vfmah_lane_f16 but the vector operand is a float16x8_t.
   * The two float16_t scalars and the vector are copied into typed locals
   * and forwarded, with __p3 passed through textually, to
   * __builtin_neon_vfmah_laneq_f16; the float16_t result is the macro value.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) first.
   * __noswap_vfmah_laneq_f16 skips that reversal; vfmsh_laneq_f16 calls it
   * with a vector it has already reversed. */
  44204 #ifdef __LITTLE_ENDIAN__
  44205 #define vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44206   float16_t __ret; \
  44207   float16_t __s0 = __p0; \
  44208   float16_t __s1 = __p1; \
  44209   float16x8_t __s2 = __p2; \
  44210   __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__s2, __p3); \
  44211   __ret; \
  44212 })
  44213 #else
  44214 #define vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44215   float16_t __ret; \
  44216   float16_t __s0 = __p0; \
  44217   float16_t __s1 = __p1; \
  44218   float16x8_t __s2 = __p2; \
  44219   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  44220   __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__rev2, __p3); \
  44221   __ret; \
  44222 })
  44223 #define __noswap_vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44224   float16_t __ret; \
  44225   float16_t __s0 = __p0; \
  44226   float16_t __s1 = __p1; \
  44227   float16x8_t __s2 = __p2; \
  44228   __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__s2, __p3); \
  44229   __ret; \
  44230 })
  44231 #endif
  44232 
  /* vfmaq_laneq_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Copies three float16x8_t operands into typed locals, casts them to
   * int8x16_t and forwards them, together with __p3 (passed through
   * textually) and the constant 40, to __builtin_neon_vfmaq_laneq_f16; the
   * result is cast back to float16x8_t.
   * Without __LITTLE_ENDIAN__ every operand is lane-reversed (7..0) before
   * the call and the result is reversed back. __noswap_vfmaq_laneq_f16 omits
   * the reversals; vfmsq_laneq_f16 uses it on already-reversed operands.
   * NOTE(review): 40 is presumably the builtin's vector type code - confirm. */
  44233 #ifdef __LITTLE_ENDIAN__
  44234 #define vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44235   float16x8_t __ret; \
  44236   float16x8_t __s0 = __p0; \
  44237   float16x8_t __s1 = __p1; \
  44238   float16x8_t __s2 = __p2; \
  44239   __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 40); \
  44240   __ret; \
  44241 })
  44242 #else
  44243 #define vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44244   float16x8_t __ret; \
  44245   float16x8_t __s0 = __p0; \
  44246   float16x8_t __s1 = __p1; \
  44247   float16x8_t __s2 = __p2; \
  44248   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44249   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  44250   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  44251   __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 40); \
  44252   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  44253   __ret; \
  44254 })
  44255 #define __noswap_vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44256   float16x8_t __ret; \
  44257   float16x8_t __s0 = __p0; \
  44258   float16x8_t __s1 = __p1; \
  44259   float16x8_t __s2 = __p2; \
  44260   __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 40); \
  44261   __ret; \
  44262 })
  44263 #endif
  44264 
  /* vfma_laneq_f16(__p0, __p1, __p2, __p3): statement-expression macro.
   * Copies two float16x4_t operands and one float16x8_t operand into typed
   * locals, casts them to int8x8_t/int8x16_t and forwards them, together
   * with __p3 (passed through textually) and the constant 8, to
   * __builtin_neon_vfma_laneq_f16; the result is cast back to float16x4_t.
   * Without __LITTLE_ENDIAN__ every vector operand is lane-reversed before
   * the call and the result is reversed back. __noswap_vfma_laneq_f16 omits
   * the reversals; vfms_laneq_f16 uses it on already-reversed operands.
   * NOTE(review): 8 is presumably the builtin's vector type code - confirm. */
  44265 #ifdef __LITTLE_ENDIAN__
  44266 #define vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44267   float16x4_t __ret; \
  44268   float16x4_t __s0 = __p0; \
  44269   float16x4_t __s1 = __p1; \
  44270   float16x8_t __s2 = __p2; \
  44271   __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 8); \
  44272   __ret; \
  44273 })
  44274 #else
  44275 #define vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44276   float16x4_t __ret; \
  44277   float16x4_t __s0 = __p0; \
  44278   float16x4_t __s1 = __p1; \
  44279   float16x8_t __s2 = __p2; \
  44280   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44281   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  44282   float16x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  44283   __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x16_t)__rev2, __p3, 8); \
  44284   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  44285   __ret; \
  44286 })
  44287 #define __noswap_vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \
  44288   float16x4_t __ret; \
  44289   float16x4_t __s0 = __p0; \
  44290   float16x4_t __s1 = __p1; \
  44291   float16x8_t __s2 = __p2; \
  44292   __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 8); \
  44293   __ret; \
  44294 })
  44295 #endif
  44296 
  /* vfmaq_n_f16(__p0, __p1, __p2): statement-expression macro.
   * Builds a float16x8_t literal holding the float16_t scalar __p2 in all
   * eight lanes and passes it as the third operand to vfmaq_f16 along with
   * the two float16x8_t operands.
   * Without __LITTLE_ENDIAN__ the two vector operands are lane-reversed,
   * __noswap_vfmaq_f16 is called instead, and the result is reversed back;
   * the broadcast literal is passed as-is (all of its lanes are equal).
   * vfmaq_f16 and __noswap_vfmaq_f16 are defined outside this excerpt. */
  44297 #ifdef __LITTLE_ENDIAN__
  44298 #define vfmaq_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44299   float16x8_t __ret; \
  44300   float16x8_t __s0 = __p0; \
  44301   float16x8_t __s1 = __p1; \
  44302   float16_t __s2 = __p2; \
  44303   __ret = vfmaq_f16(__s0, __s1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \
  44304   __ret; \
  44305 })
  44306 #else
  44307 #define vfmaq_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44308   float16x8_t __ret; \
  44309   float16x8_t __s0 = __p0; \
  44310   float16x8_t __s1 = __p1; \
  44311   float16_t __s2 = __p2; \
  44312   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44313   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  44314   __ret = __noswap_vfmaq_f16(__rev0, __rev1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \
  44315   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  44316   __ret; \
  44317 })
  44318 #endif
  44319 
  /* vfma_n_f16(__p0, __p1, __p2): statement-expression macro.
   * Builds a float16x4_t literal holding the float16_t scalar __p2 in all
   * four lanes and passes it as the third operand to vfma_f16 along with
   * the two float16x4_t operands.
   * Without __LITTLE_ENDIAN__ the two vector operands are lane-reversed,
   * __noswap_vfma_f16 is called instead, and the result is reversed back;
   * the broadcast literal is passed as-is (all of its lanes are equal).
   * vfma_f16 and __noswap_vfma_f16 are defined outside this excerpt. */
  44320 #ifdef __LITTLE_ENDIAN__
  44321 #define vfma_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44322   float16x4_t __ret; \
  44323   float16x4_t __s0 = __p0; \
  44324   float16x4_t __s1 = __p1; \
  44325   float16_t __s2 = __p2; \
  44326   __ret = vfma_f16(__s0, __s1, (float16x4_t) {__s2, __s2, __s2, __s2}); \
  44327   __ret; \
  44328 })
  44329 #else
  44330 #define vfma_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44331   float16x4_t __ret; \
  44332   float16x4_t __s0 = __p0; \
  44333   float16x4_t __s1 = __p1; \
  44334   float16_t __s2 = __p2; \
  44335   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44336   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  44337   __ret = __noswap_vfma_f16(__rev0, __rev1, (float16x4_t) {__s2, __s2, __s2, __s2}); \
  44338   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  44339   __ret; \
  44340 })
  44341 #endif
  44342 
  /* vfmsh_lane_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfmah_lane_f16 with the second float16_t scalar negated.
   * Without __LITTLE_ENDIAN__ the float16x4_t vector is lane-reversed here
   * and __noswap_vfmah_lane_f16 is used so it is not reversed a second time.
   * The _246/_247 suffixes keep these locals distinct from the unsuffixed
   * __ret/__s0/__s1/__s2 locals that the vfmah_lane_f16 macros declare when
   * they expand inside this statement expression. */
  44343 #ifdef __LITTLE_ENDIAN__
  44344 #define vfmsh_lane_f16(__p0_246, __p1_246, __p2_246, __p3_246) __extension__ ({ \
  44345   float16_t __ret_246; \
  44346   float16_t __s0_246 = __p0_246; \
  44347   float16_t __s1_246 = __p1_246; \
  44348   float16x4_t __s2_246 = __p2_246; \
  44349   __ret_246 = vfmah_lane_f16(__s0_246, -__s1_246, __s2_246, __p3_246); \
  44350   __ret_246; \
  44351 })
  44352 #else
  44353 #define vfmsh_lane_f16(__p0_247, __p1_247, __p2_247, __p3_247) __extension__ ({ \
  44354   float16_t __ret_247; \
  44355   float16_t __s0_247 = __p0_247; \
  44356   float16_t __s1_247 = __p1_247; \
  44357   float16x4_t __s2_247 = __p2_247; \
  44358   float16x4_t __rev2_247;  __rev2_247 = __builtin_shufflevector(__s2_247, __s2_247, 3, 2, 1, 0); \
  44359   __ret_247 = __noswap_vfmah_lane_f16(__s0_247, -__s1_247, __rev2_247, __p3_247); \
  44360   __ret_247; \
  44361 })
  44362 #endif
  44363 
  /* vfmsq_lane_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfmaq_lane_f16 with the second float16x8_t operand negated (unary minus
   * applied to the vector).
   * Without __LITTLE_ENDIAN__ all three vector operands are lane-reversed
   * here, __noswap_vfmaq_lane_f16 is used so they are not reversed again,
   * and the float16x8_t result is reversed back.
   * The _248/_249 suffixes keep these locals distinct from the unsuffixed
   * locals declared by the vfmaq_lane_f16 macros expanded inside. */
  44364 #ifdef __LITTLE_ENDIAN__
  44365 #define vfmsq_lane_f16(__p0_248, __p1_248, __p2_248, __p3_248) __extension__ ({ \
  44366   float16x8_t __ret_248; \
  44367   float16x8_t __s0_248 = __p0_248; \
  44368   float16x8_t __s1_248 = __p1_248; \
  44369   float16x4_t __s2_248 = __p2_248; \
  44370   __ret_248 = vfmaq_lane_f16(__s0_248, -__s1_248, __s2_248, __p3_248); \
  44371   __ret_248; \
  44372 })
  44373 #else
  44374 #define vfmsq_lane_f16(__p0_249, __p1_249, __p2_249, __p3_249) __extension__ ({ \
  44375   float16x8_t __ret_249; \
  44376   float16x8_t __s0_249 = __p0_249; \
  44377   float16x8_t __s1_249 = __p1_249; \
  44378   float16x4_t __s2_249 = __p2_249; \
  44379   float16x8_t __rev0_249;  __rev0_249 = __builtin_shufflevector(__s0_249, __s0_249, 7, 6, 5, 4, 3, 2, 1, 0); \
  44380   float16x8_t __rev1_249;  __rev1_249 = __builtin_shufflevector(__s1_249, __s1_249, 7, 6, 5, 4, 3, 2, 1, 0); \
  44381   float16x4_t __rev2_249;  __rev2_249 = __builtin_shufflevector(__s2_249, __s2_249, 3, 2, 1, 0); \
  44382   __ret_249 = __noswap_vfmaq_lane_f16(__rev0_249, -__rev1_249, __rev2_249, __p3_249); \
  44383   __ret_249 = __builtin_shufflevector(__ret_249, __ret_249, 7, 6, 5, 4, 3, 2, 1, 0); \
  44384   __ret_249; \
  44385 })
  44386 #endif
  44387 
  /* vfms_lane_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfma_lane_f16 with the second float16x4_t operand negated (unary minus
   * applied to the vector).
   * Without __LITTLE_ENDIAN__ all three operands are lane-reversed here,
   * __noswap_vfma_lane_f16 is used so they are not reversed again, and the
   * float16x4_t result is reversed back.
   * The _250/_251 suffixes keep these locals distinct from the unsuffixed
   * locals declared by the vfma_lane_f16 macros expanded inside. */
  44388 #ifdef __LITTLE_ENDIAN__
  44389 #define vfms_lane_f16(__p0_250, __p1_250, __p2_250, __p3_250) __extension__ ({ \
  44390   float16x4_t __ret_250; \
  44391   float16x4_t __s0_250 = __p0_250; \
  44392   float16x4_t __s1_250 = __p1_250; \
  44393   float16x4_t __s2_250 = __p2_250; \
  44394   __ret_250 = vfma_lane_f16(__s0_250, -__s1_250, __s2_250, __p3_250); \
  44395   __ret_250; \
  44396 })
  44397 #else
  44398 #define vfms_lane_f16(__p0_251, __p1_251, __p2_251, __p3_251) __extension__ ({ \
  44399   float16x4_t __ret_251; \
  44400   float16x4_t __s0_251 = __p0_251; \
  44401   float16x4_t __s1_251 = __p1_251; \
  44402   float16x4_t __s2_251 = __p2_251; \
  44403   float16x4_t __rev0_251;  __rev0_251 = __builtin_shufflevector(__s0_251, __s0_251, 3, 2, 1, 0); \
  44404   float16x4_t __rev1_251;  __rev1_251 = __builtin_shufflevector(__s1_251, __s1_251, 3, 2, 1, 0); \
  44405   float16x4_t __rev2_251;  __rev2_251 = __builtin_shufflevector(__s2_251, __s2_251, 3, 2, 1, 0); \
  44406   __ret_251 = __noswap_vfma_lane_f16(__rev0_251, -__rev1_251, __rev2_251, __p3_251); \
  44407   __ret_251 = __builtin_shufflevector(__ret_251, __ret_251, 3, 2, 1, 0); \
  44408   __ret_251; \
  44409 })
  44410 #endif
  44411 
  /* vfmsh_laneq_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfmah_laneq_f16 with the second float16_t scalar negated.
   * Without __LITTLE_ENDIAN__ the float16x8_t vector is lane-reversed here
   * and __noswap_vfmah_laneq_f16 is used so it is not reversed again.
   * The _252/_253 suffixes keep these locals distinct from the unsuffixed
   * locals declared by the vfmah_laneq_f16 macros expanded inside. */
  44412 #ifdef __LITTLE_ENDIAN__
  44413 #define vfmsh_laneq_f16(__p0_252, __p1_252, __p2_252, __p3_252) __extension__ ({ \
  44414   float16_t __ret_252; \
  44415   float16_t __s0_252 = __p0_252; \
  44416   float16_t __s1_252 = __p1_252; \
  44417   float16x8_t __s2_252 = __p2_252; \
  44418   __ret_252 = vfmah_laneq_f16(__s0_252, -__s1_252, __s2_252, __p3_252); \
  44419   __ret_252; \
  44420 })
  44421 #else
  44422 #define vfmsh_laneq_f16(__p0_253, __p1_253, __p2_253, __p3_253) __extension__ ({ \
  44423   float16_t __ret_253; \
  44424   float16_t __s0_253 = __p0_253; \
  44425   float16_t __s1_253 = __p1_253; \
  44426   float16x8_t __s2_253 = __p2_253; \
  44427   float16x8_t __rev2_253;  __rev2_253 = __builtin_shufflevector(__s2_253, __s2_253, 7, 6, 5, 4, 3, 2, 1, 0); \
  44428   __ret_253 = __noswap_vfmah_laneq_f16(__s0_253, -__s1_253, __rev2_253, __p3_253); \
  44429   __ret_253; \
  44430 })
  44431 #endif
  44432 
  /* vfmsq_laneq_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfmaq_laneq_f16 with the second float16x8_t operand negated (unary minus
   * applied to the vector).
   * Without __LITTLE_ENDIAN__ all three operands are lane-reversed here,
   * __noswap_vfmaq_laneq_f16 is used so they are not reversed again, and
   * the float16x8_t result is reversed back.
   * The _254/_255 suffixes keep these locals distinct from the unsuffixed
   * locals declared by the vfmaq_laneq_f16 macros expanded inside. */
  44433 #ifdef __LITTLE_ENDIAN__
  44434 #define vfmsq_laneq_f16(__p0_254, __p1_254, __p2_254, __p3_254) __extension__ ({ \
  44435   float16x8_t __ret_254; \
  44436   float16x8_t __s0_254 = __p0_254; \
  44437   float16x8_t __s1_254 = __p1_254; \
  44438   float16x8_t __s2_254 = __p2_254; \
  44439   __ret_254 = vfmaq_laneq_f16(__s0_254, -__s1_254, __s2_254, __p3_254); \
  44440   __ret_254; \
  44441 })
  44442 #else
  44443 #define vfmsq_laneq_f16(__p0_255, __p1_255, __p2_255, __p3_255) __extension__ ({ \
  44444   float16x8_t __ret_255; \
  44445   float16x8_t __s0_255 = __p0_255; \
  44446   float16x8_t __s1_255 = __p1_255; \
  44447   float16x8_t __s2_255 = __p2_255; \
  44448   float16x8_t __rev0_255;  __rev0_255 = __builtin_shufflevector(__s0_255, __s0_255, 7, 6, 5, 4, 3, 2, 1, 0); \
  44449   float16x8_t __rev1_255;  __rev1_255 = __builtin_shufflevector(__s1_255, __s1_255, 7, 6, 5, 4, 3, 2, 1, 0); \
  44450   float16x8_t __rev2_255;  __rev2_255 = __builtin_shufflevector(__s2_255, __s2_255, 7, 6, 5, 4, 3, 2, 1, 0); \
  44451   __ret_255 = __noswap_vfmaq_laneq_f16(__rev0_255, -__rev1_255, __rev2_255, __p3_255); \
  44452   __ret_255 = __builtin_shufflevector(__ret_255, __ret_255, 7, 6, 5, 4, 3, 2, 1, 0); \
  44453   __ret_255; \
  44454 })
  44455 #endif
  44456 
  /* vfms_laneq_f16(p0, p1, p2, p3): statement-expression macro that expands
   * vfma_laneq_f16 with the second float16x4_t operand negated (unary minus
   * applied to the vector); the third operand is a float16x8_t.
   * Without __LITTLE_ENDIAN__ all three vector operands are lane-reversed
   * here, __noswap_vfma_laneq_f16 is used so they are not reversed again,
   * and the float16x4_t result is reversed back.
   * The _256/_257 suffixes keep these locals distinct from the unsuffixed
   * locals declared by the vfma_laneq_f16 macros expanded inside. */
  44457 #ifdef __LITTLE_ENDIAN__
  44458 #define vfms_laneq_f16(__p0_256, __p1_256, __p2_256, __p3_256) __extension__ ({ \
  44459   float16x4_t __ret_256; \
  44460   float16x4_t __s0_256 = __p0_256; \
  44461   float16x4_t __s1_256 = __p1_256; \
  44462   float16x8_t __s2_256 = __p2_256; \
  44463   __ret_256 = vfma_laneq_f16(__s0_256, -__s1_256, __s2_256, __p3_256); \
  44464   __ret_256; \
  44465 })
  44466 #else
  44467 #define vfms_laneq_f16(__p0_257, __p1_257, __p2_257, __p3_257) __extension__ ({ \
  44468   float16x4_t __ret_257; \
  44469   float16x4_t __s0_257 = __p0_257; \
  44470   float16x4_t __s1_257 = __p1_257; \
  44471   float16x8_t __s2_257 = __p2_257; \
  44472   float16x4_t __rev0_257;  __rev0_257 = __builtin_shufflevector(__s0_257, __s0_257, 3, 2, 1, 0); \
  44473   float16x4_t __rev1_257;  __rev1_257 = __builtin_shufflevector(__s1_257, __s1_257, 3, 2, 1, 0); \
  44474   float16x8_t __rev2_257;  __rev2_257 = __builtin_shufflevector(__s2_257, __s2_257, 7, 6, 5, 4, 3, 2, 1, 0); \
  44475   __ret_257 = __noswap_vfma_laneq_f16(__rev0_257, -__rev1_257, __rev2_257, __p3_257); \
  44476   __ret_257 = __builtin_shufflevector(__ret_257, __ret_257, 3, 2, 1, 0); \
  44477   __ret_257; \
  44478 })
  44479 #endif
  44480 
  /* vfmsq_n_f16(__p0, __p1, __p2): statement-expression macro.
   * Calls vfmaq_f16 with the first float16x8_t operand, the negated second
   * float16x8_t operand, and a float16x8_t literal holding the float16_t
   * scalar __p2 in all eight lanes.
   * Without __LITTLE_ENDIAN__ the two vector operands are lane-reversed,
   * __noswap_vfmaq_f16 is called instead, and the result is reversed back;
   * the broadcast literal is passed as-is (all of its lanes are equal).
   * vfmaq_f16 and __noswap_vfmaq_f16 are defined outside this excerpt. */
  44481 #ifdef __LITTLE_ENDIAN__
  44482 #define vfmsq_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44483   float16x8_t __ret; \
  44484   float16x8_t __s0 = __p0; \
  44485   float16x8_t __s1 = __p1; \
  44486   float16_t __s2 = __p2; \
  44487   __ret = vfmaq_f16(__s0, -__s1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \
  44488   __ret; \
  44489 })
  44490 #else
  44491 #define vfmsq_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44492   float16x8_t __ret; \
  44493   float16x8_t __s0 = __p0; \
  44494   float16x8_t __s1 = __p1; \
  44495   float16_t __s2 = __p2; \
  44496   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44497   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  44498   __ret = __noswap_vfmaq_f16(__rev0, -__rev1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \
  44499   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  44500   __ret; \
  44501 })
  44502 #endif
  44503 
  /* vfms_n_f16(__p0, __p1, __p2): statement-expression macro.
   * Calls vfma_f16 with the first float16x4_t operand, the negated second
   * float16x4_t operand, and a float16x4_t literal holding the float16_t
   * scalar __p2 in all four lanes.
   * Without __LITTLE_ENDIAN__ the two vector operands are lane-reversed,
   * __noswap_vfma_f16 is called instead, and the result is reversed back;
   * the broadcast literal is passed as-is (all of its lanes are equal).
   * vfma_f16 and __noswap_vfma_f16 are defined outside this excerpt. */
  44504 #ifdef __LITTLE_ENDIAN__
  44505 #define vfms_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44506   float16x4_t __ret; \
  44507   float16x4_t __s0 = __p0; \
  44508   float16x4_t __s1 = __p1; \
  44509   float16_t __s2 = __p2; \
  44510   __ret = vfma_f16(__s0, -__s1, (float16x4_t) {__s2, __s2, __s2, __s2}); \
  44511   __ret; \
  44512 })
  44513 #else
  44514 #define vfms_n_f16(__p0, __p1, __p2) __extension__ ({ \
  44515   float16x4_t __ret; \
  44516   float16x4_t __s0 = __p0; \
  44517   float16x4_t __s1 = __p1; \
  44518   float16_t __s2 = __p2; \
  44519   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44520   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  44521   __ret = __noswap_vfma_f16(__rev0, -__rev1, (float16x4_t) {__s2, __s2, __s2, __s2}); \
  44522   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  44523   __ret; \
  44524 })
  44525 #endif
  44526 
  /* vmaxnmvq_f16(__p0): statement-expression macro that copies its argument
   * into a float16x8_t local, casts it to int8x16_t, passes it to
   * __builtin_neon_vmaxnmvq_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) before the
   * call; the scalar result needs no reversal.
   * NOTE(review): presumably a max-number reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44527 #ifdef __LITTLE_ENDIAN__
  44528 #define vmaxnmvq_f16(__p0) __extension__ ({ \
  44529   float16_t __ret; \
  44530   float16x8_t __s0 = __p0; \
  44531   __ret = (float16_t) __builtin_neon_vmaxnmvq_f16((int8x16_t)__s0); \
  44532   __ret; \
  44533 })
  44534 #else
  44535 #define vmaxnmvq_f16(__p0) __extension__ ({ \
  44536   float16_t __ret; \
  44537   float16x8_t __s0 = __p0; \
  44538   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44539   __ret = (float16_t) __builtin_neon_vmaxnmvq_f16((int8x16_t)__rev0); \
  44540   __ret; \
  44541 })
  44542 #endif
  44543 
  /* vmaxnmv_f16(__p0): statement-expression macro that copies its argument
   * into a float16x4_t local, casts it to int8x8_t, passes it to
   * __builtin_neon_vmaxnmv_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) before
   * the call; the scalar result needs no reversal.
   * NOTE(review): presumably a max-number reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44544 #ifdef __LITTLE_ENDIAN__
  44545 #define vmaxnmv_f16(__p0) __extension__ ({ \
  44546   float16_t __ret; \
  44547   float16x4_t __s0 = __p0; \
  44548   __ret = (float16_t) __builtin_neon_vmaxnmv_f16((int8x8_t)__s0); \
  44549   __ret; \
  44550 })
  44551 #else
  44552 #define vmaxnmv_f16(__p0) __extension__ ({ \
  44553   float16_t __ret; \
  44554   float16x4_t __s0 = __p0; \
  44555   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44556   __ret = (float16_t) __builtin_neon_vmaxnmv_f16((int8x8_t)__rev0); \
  44557   __ret; \
  44558 })
  44559 #endif
  44560 
  /* vmaxvq_f16(__p0): statement-expression macro that copies its argument
   * into a float16x8_t local, casts it to int8x16_t, passes it to
   * __builtin_neon_vmaxvq_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) before the
   * call; the scalar result needs no reversal.
   * NOTE(review): presumably a maximum reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44561 #ifdef __LITTLE_ENDIAN__
  44562 #define vmaxvq_f16(__p0) __extension__ ({ \
  44563   float16_t __ret; \
  44564   float16x8_t __s0 = __p0; \
  44565   __ret = (float16_t) __builtin_neon_vmaxvq_f16((int8x16_t)__s0); \
  44566   __ret; \
  44567 })
  44568 #else
  44569 #define vmaxvq_f16(__p0) __extension__ ({ \
  44570   float16_t __ret; \
  44571   float16x8_t __s0 = __p0; \
  44572   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44573   __ret = (float16_t) __builtin_neon_vmaxvq_f16((int8x16_t)__rev0); \
  44574   __ret; \
  44575 })
  44576 #endif
  44577 
  /* vmaxv_f16(__p0): statement-expression macro that copies its argument
   * into a float16x4_t local, casts it to int8x8_t, passes it to
   * __builtin_neon_vmaxv_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) before
   * the call; the scalar result needs no reversal.
   * NOTE(review): presumably a maximum reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44578 #ifdef __LITTLE_ENDIAN__
  44579 #define vmaxv_f16(__p0) __extension__ ({ \
  44580   float16_t __ret; \
  44581   float16x4_t __s0 = __p0; \
  44582   __ret = (float16_t) __builtin_neon_vmaxv_f16((int8x8_t)__s0); \
  44583   __ret; \
  44584 })
  44585 #else
  44586 #define vmaxv_f16(__p0) __extension__ ({ \
  44587   float16_t __ret; \
  44588   float16x4_t __s0 = __p0; \
  44589   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44590   __ret = (float16_t) __builtin_neon_vmaxv_f16((int8x8_t)__rev0); \
  44591   __ret; \
  44592 })
  44593 #endif
  44594 
  /* vminnmvq_f16(__p0): statement-expression macro that copies its argument
   * into a float16x8_t local, casts it to int8x16_t, passes it to
   * __builtin_neon_vminnmvq_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) before the
   * call; the scalar result needs no reversal.
   * NOTE(review): presumably a min-number reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44595 #ifdef __LITTLE_ENDIAN__
  44596 #define vminnmvq_f16(__p0) __extension__ ({ \
  44597   float16_t __ret; \
  44598   float16x8_t __s0 = __p0; \
  44599   __ret = (float16_t) __builtin_neon_vminnmvq_f16((int8x16_t)__s0); \
  44600   __ret; \
  44601 })
  44602 #else
  44603 #define vminnmvq_f16(__p0) __extension__ ({ \
  44604   float16_t __ret; \
  44605   float16x8_t __s0 = __p0; \
  44606   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44607   __ret = (float16_t) __builtin_neon_vminnmvq_f16((int8x16_t)__rev0); \
  44608   __ret; \
  44609 })
  44610 #endif
  44611 
  /* vminnmv_f16(__p0): statement-expression macro that copies its argument
   * into a float16x4_t local, casts it to int8x8_t, passes it to
   * __builtin_neon_vminnmv_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) before
   * the call; the scalar result needs no reversal.
   * NOTE(review): presumably a min-number reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44612 #ifdef __LITTLE_ENDIAN__
  44613 #define vminnmv_f16(__p0) __extension__ ({ \
  44614   float16_t __ret; \
  44615   float16x4_t __s0 = __p0; \
  44616   __ret = (float16_t) __builtin_neon_vminnmv_f16((int8x8_t)__s0); \
  44617   __ret; \
  44618 })
  44619 #else
  44620 #define vminnmv_f16(__p0) __extension__ ({ \
  44621   float16_t __ret; \
  44622   float16x4_t __s0 = __p0; \
  44623   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44624   __ret = (float16_t) __builtin_neon_vminnmv_f16((int8x8_t)__rev0); \
  44625   __ret; \
  44626 })
  44627 #endif
  44628 
  /* vminvq_f16(__p0): statement-expression macro that copies its argument
   * into a float16x8_t local, casts it to int8x16_t, passes it to
   * __builtin_neon_vminvq_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) before the
   * call; the scalar result needs no reversal.
   * NOTE(review): presumably a minimum reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44629 #ifdef __LITTLE_ENDIAN__
  44630 #define vminvq_f16(__p0) __extension__ ({ \
  44631   float16_t __ret; \
  44632   float16x8_t __s0 = __p0; \
  44633   __ret = (float16_t) __builtin_neon_vminvq_f16((int8x16_t)__s0); \
  44634   __ret; \
  44635 })
  44636 #else
  44637 #define vminvq_f16(__p0) __extension__ ({ \
  44638   float16_t __ret; \
  44639   float16x8_t __s0 = __p0; \
  44640   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  44641   __ret = (float16_t) __builtin_neon_vminvq_f16((int8x16_t)__rev0); \
  44642   __ret; \
  44643 })
  44644 #endif
  44645 
  /* vminv_f16(__p0): statement-expression macro that copies its argument
   * into a float16x4_t local, casts it to int8x8_t, passes it to
   * __builtin_neon_vminv_f16 and yields the result as a float16_t.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) before
   * the call; the scalar result needs no reversal.
   * NOTE(review): presumably a minimum reduction across lanes per the
   * intrinsic's name; the builtin's semantics are not visible here. */
  44646 #ifdef __LITTLE_ENDIAN__
  44647 #define vminv_f16(__p0) __extension__ ({ \
  44648   float16_t __ret; \
  44649   float16x4_t __s0 = __p0; \
  44650   __ret = (float16_t) __builtin_neon_vminv_f16((int8x8_t)__s0); \
  44651   __ret; \
  44652 })
  44653 #else
  44654 #define vminv_f16(__p0) __extension__ ({ \
  44655   float16_t __ret; \
  44656   float16x4_t __s0 = __p0; \
  44657   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  44658   __ret = (float16_t) __builtin_neon_vminv_f16((int8x8_t)__rev0); \
  44659   __ret; \
  44660 })
  44661 #endif
  44662 
  /* vmulq_laneq_f16(p0, p1, p2): statement-expression macro that multiplies
   * the float16x8_t operand p0 (with the `*` operator) by the value of
   * splatq_laneq_f16(p1, p2), where p1 is a float16x8_t and p2 is passed
   * through textually.
   * Without __LITTLE_ENDIAN__ both vectors are lane-reversed (7..0),
   * __noswap_splatq_laneq_f16 is used, and the product is reversed back.
   * splatq_laneq_f16 and its __noswap_ form are defined outside this excerpt.
   * NOTE(review): the _258/_259 suffixes presumably keep these locals from
   * colliding with locals of the nested splat expansion - confirm. */
  44663 #ifdef __LITTLE_ENDIAN__
  44664 #define vmulq_laneq_f16(__p0_258, __p1_258, __p2_258) __extension__ ({ \
  44665   float16x8_t __ret_258; \
  44666   float16x8_t __s0_258 = __p0_258; \
  44667   float16x8_t __s1_258 = __p1_258; \
  44668   __ret_258 = __s0_258 * splatq_laneq_f16(__s1_258, __p2_258); \
  44669   __ret_258; \
  44670 })
  44671 #else
  44672 #define vmulq_laneq_f16(__p0_259, __p1_259, __p2_259) __extension__ ({ \
  44673   float16x8_t __ret_259; \
  44674   float16x8_t __s0_259 = __p0_259; \
  44675   float16x8_t __s1_259 = __p1_259; \
  44676   float16x8_t __rev0_259;  __rev0_259 = __builtin_shufflevector(__s0_259, __s0_259, 7, 6, 5, 4, 3, 2, 1, 0); \
  44677   float16x8_t __rev1_259;  __rev1_259 = __builtin_shufflevector(__s1_259, __s1_259, 7, 6, 5, 4, 3, 2, 1, 0); \
  44678   __ret_259 = __rev0_259 * __noswap_splatq_laneq_f16(__rev1_259, __p2_259); \
  44679   __ret_259 = __builtin_shufflevector(__ret_259, __ret_259, 7, 6, 5, 4, 3, 2, 1, 0); \
  44680   __ret_259; \
  44681 })
  44682 #endif
  44683 
  /* vmul_laneq_f16(p0, p1, p2): statement-expression macro that multiplies
   * the float16x4_t operand p0 (with the `*` operator) by the value of
   * splat_laneq_f16(p1, p2), where p1 is a float16x8_t and p2 is passed
   * through textually.
   * Without __LITTLE_ENDIAN__ p0 is lane-reversed (3,2,1,0) and p1 (7..0),
   * __noswap_splat_laneq_f16 is used, and the product is reversed back.
   * splat_laneq_f16 and its __noswap_ form are defined outside this excerpt.
   * NOTE(review): the _260/_261 suffixes presumably keep these locals from
   * colliding with locals of the nested splat expansion - confirm. */
  44684 #ifdef __LITTLE_ENDIAN__
  44685 #define vmul_laneq_f16(__p0_260, __p1_260, __p2_260) __extension__ ({ \
  44686   float16x4_t __ret_260; \
  44687   float16x4_t __s0_260 = __p0_260; \
  44688   float16x8_t __s1_260 = __p1_260; \
  44689   __ret_260 = __s0_260 * splat_laneq_f16(__s1_260, __p2_260); \
  44690   __ret_260; \
  44691 })
  44692 #else
  44693 #define vmul_laneq_f16(__p0_261, __p1_261, __p2_261) __extension__ ({ \
  44694   float16x4_t __ret_261; \
  44695   float16x4_t __s0_261 = __p0_261; \
  44696   float16x8_t __s1_261 = __p1_261; \
  44697   float16x4_t __rev0_261;  __rev0_261 = __builtin_shufflevector(__s0_261, __s0_261, 3, 2, 1, 0); \
  44698   float16x8_t __rev1_261;  __rev1_261 = __builtin_shufflevector(__s1_261, __s1_261, 7, 6, 5, 4, 3, 2, 1, 0); \
  44699   __ret_261 = __rev0_261 * __noswap_splat_laneq_f16(__rev1_261, __p2_261); \
  44700   __ret_261 = __builtin_shufflevector(__ret_261, __ret_261, 3, 2, 1, 0); \
  44701   __ret_261; \
  44702 })
  44703 #endif
  44704 
  /* vmulxq_f16: casts both float16x8_t operands to int8x16_t, passes them
   * with the constant 40 to __builtin_neon_vmulxq_f16 and returns the result
   * cast back to float16x8_t. Declared with target "fullfp16,neon".
   * Without __LITTLE_ENDIAN__ both operands are lane-reversed (7..0) before
   * the call and the result is reversed back. __noswap_vmulxq_f16 (defined
   * only in the #else branch) performs the call without any reversal; the
   * vmulxq_lane_f16 and vmulxq_laneq_f16 macros in this file call it with
   * operands they have already reversed.
   * NOTE(review): 40 is presumably the builtin's vector type code - confirm.
   * __ai is defined outside this excerpt. */
  44705 #ifdef __LITTLE_ENDIAN__
  44706 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulxq_f16(float16x8_t __p0, float16x8_t __p1) {
  44707   float16x8_t __ret;
  44708   __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44709   return __ret;
  44710 }
  44711 #else
  44712 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulxq_f16(float16x8_t __p0, float16x8_t __p1) {
  44713   float16x8_t __ret;
  44714   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44715   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44716   __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  44717   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44718   return __ret;
  44719 }
  44720 __ai __attribute__((target("fullfp16,neon"))) float16x8_t __noswap_vmulxq_f16(float16x8_t __p0, float16x8_t __p1) {
  44721   float16x8_t __ret;
  44722   __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44723   return __ret;
  44724 }
  44725 #endif
  44726 
  /* vmulx_f16: casts both float16x4_t operands to int8x8_t, passes them with
   * the constant 8 to __builtin_neon_vmulx_f16 and returns the result cast
   * back to float16x4_t. Declared with target "fullfp16,neon".
   * Without __LITTLE_ENDIAN__ both operands are lane-reversed (3,2,1,0)
   * before the call and the result is reversed back. __noswap_vmulx_f16
   * (defined only in the #else branch) performs the call without any
   * reversal; the vmulx_lane_f16 and vmulx_laneq_f16 macros in this file
   * call it with operands they have already reversed.
   * NOTE(review): 8 is presumably the builtin's vector type code - confirm.
   * __ai is defined outside this excerpt. */
  44727 #ifdef __LITTLE_ENDIAN__
  44728 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmulx_f16(float16x4_t __p0, float16x4_t __p1) {
  44729   float16x4_t __ret;
  44730   __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  44731   return __ret;
  44732 }
  44733 #else
  44734 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmulx_f16(float16x4_t __p0, float16x4_t __p1) {
  44735   float16x4_t __ret;
  44736   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  44737   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  44738   __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  44739   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  44740   return __ret;
  44741 }
  44742 __ai __attribute__((target("fullfp16,neon"))) float16x4_t __noswap_vmulx_f16(float16x4_t __p0, float16x4_t __p1) {
  44743   float16x4_t __ret;
  44744   __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  44745   return __ret;
  44746 }
  44747 #endif
  44748 
  /* vmulxh_lane_f16(__p0, __p1, __p2): statement-expression macro that
   * copies the float16_t scalar and the float16x4_t vector into typed locals
   * and forwards them, with __p2 passed through textually, to
   * __builtin_neon_vmulxh_lane_f16; the float16_t result is the macro value.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (3,2,1,0) first.
   * NOTE(review): __p2 is presumably a constant lane index - confirm. */
  44749 #ifdef __LITTLE_ENDIAN__
  44750 #define vmulxh_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  44751   float16_t __ret; \
  44752   float16_t __s0 = __p0; \
  44753   float16x4_t __s1 = __p1; \
  44754   __ret = (float16_t) __builtin_neon_vmulxh_lane_f16(__s0, (float16x4_t)__s1, __p2); \
  44755   __ret; \
  44756 })
  44757 #else
  44758 #define vmulxh_lane_f16(__p0, __p1, __p2) __extension__ ({ \
  44759   float16_t __ret; \
  44760   float16_t __s0 = __p0; \
  44761   float16x4_t __s1 = __p1; \
  44762   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  44763   __ret = (float16_t) __builtin_neon_vmulxh_lane_f16(__s0, (float16x4_t)__rev1, __p2); \
  44764   __ret; \
  44765 })
  44766 #endif
  44767 
  /* vmulxq_lane_f16(p0, p1, p2): statement-expression macro that calls
   * vmulxq_f16 on the float16x8_t operand p0 and the value of
   * splatq_lane_f16(p1, p2), where p1 is a float16x4_t and p2 is passed
   * through textually.
   * Without __LITTLE_ENDIAN__ p0 is lane-reversed (7..0) and p1 (3,2,1,0),
   * the __noswap_ forms of vmulxq_f16 and splatq_lane_f16 are used, and the
   * result is reversed back.
   * splatq_lane_f16 and its __noswap_ form are defined outside this excerpt.
   * NOTE(review): the _262/_263 suffixes presumably keep these locals from
   * colliding with locals of the nested splat expansion - confirm. */
  44768 #ifdef __LITTLE_ENDIAN__
  44769 #define vmulxq_lane_f16(__p0_262, __p1_262, __p2_262) __extension__ ({ \
  44770   float16x8_t __ret_262; \
  44771   float16x8_t __s0_262 = __p0_262; \
  44772   float16x4_t __s1_262 = __p1_262; \
  44773   __ret_262 = vmulxq_f16(__s0_262, splatq_lane_f16(__s1_262, __p2_262)); \
  44774   __ret_262; \
  44775 })
  44776 #else
  44777 #define vmulxq_lane_f16(__p0_263, __p1_263, __p2_263) __extension__ ({ \
  44778   float16x8_t __ret_263; \
  44779   float16x8_t __s0_263 = __p0_263; \
  44780   float16x4_t __s1_263 = __p1_263; \
  44781   float16x8_t __rev0_263;  __rev0_263 = __builtin_shufflevector(__s0_263, __s0_263, 7, 6, 5, 4, 3, 2, 1, 0); \
  44782   float16x4_t __rev1_263;  __rev1_263 = __builtin_shufflevector(__s1_263, __s1_263, 3, 2, 1, 0); \
  44783   __ret_263 = __noswap_vmulxq_f16(__rev0_263, __noswap_splatq_lane_f16(__rev1_263, __p2_263)); \
  44784   __ret_263 = __builtin_shufflevector(__ret_263, __ret_263, 7, 6, 5, 4, 3, 2, 1, 0); \
  44785   __ret_263; \
  44786 })
  44787 #endif
  44788 
  /* vmulx_lane_f16(p0, p1, p2): statement-expression macro that calls
   * vmulx_f16 on the float16x4_t operand p0 and the value of
   * splat_lane_f16(p1, p2), where p1 is a float16x4_t and p2 is passed
   * through textually.
   * Without __LITTLE_ENDIAN__ both vectors are lane-reversed (3,2,1,0), the
   * __noswap_ forms of vmulx_f16 and splat_lane_f16 are used, and the
   * result is reversed back.
   * splat_lane_f16 and its __noswap_ form are defined outside this excerpt.
   * NOTE(review): the _264/_265 suffixes presumably keep these locals from
   * colliding with locals of the nested splat expansion - confirm. */
  44789 #ifdef __LITTLE_ENDIAN__
  44790 #define vmulx_lane_f16(__p0_264, __p1_264, __p2_264) __extension__ ({ \
  44791   float16x4_t __ret_264; \
  44792   float16x4_t __s0_264 = __p0_264; \
  44793   float16x4_t __s1_264 = __p1_264; \
  44794   __ret_264 = vmulx_f16(__s0_264, splat_lane_f16(__s1_264, __p2_264)); \
  44795   __ret_264; \
  44796 })
  44797 #else
  44798 #define vmulx_lane_f16(__p0_265, __p1_265, __p2_265) __extension__ ({ \
  44799   float16x4_t __ret_265; \
  44800   float16x4_t __s0_265 = __p0_265; \
  44801   float16x4_t __s1_265 = __p1_265; \
  44802   float16x4_t __rev0_265;  __rev0_265 = __builtin_shufflevector(__s0_265, __s0_265, 3, 2, 1, 0); \
  44803   float16x4_t __rev1_265;  __rev1_265 = __builtin_shufflevector(__s1_265, __s1_265, 3, 2, 1, 0); \
  44804   __ret_265 = __noswap_vmulx_f16(__rev0_265, __noswap_splat_lane_f16(__rev1_265, __p2_265)); \
  44805   __ret_265 = __builtin_shufflevector(__ret_265, __ret_265, 3, 2, 1, 0); \
  44806   __ret_265; \
  44807 })
  44808 #endif
  44809 
  /* vmulxh_laneq_f16(__p0, __p1, __p2): statement-expression macro that
   * copies the float16_t scalar and the float16x8_t vector into typed locals
   * and forwards them, with __p2 passed through textually, to
   * __builtin_neon_vmulxh_laneq_f16; the float16_t result is the macro value.
   * Without __LITTLE_ENDIAN__ the vector is lane-reversed (7..0) first.
   * NOTE(review): __p2 is presumably a constant lane index - confirm. */
  44810 #ifdef __LITTLE_ENDIAN__
  44811 #define vmulxh_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  44812   float16_t __ret; \
  44813   float16_t __s0 = __p0; \
  44814   float16x8_t __s1 = __p1; \
  44815   __ret = (float16_t) __builtin_neon_vmulxh_laneq_f16(__s0, (float16x8_t)__s1, __p2); \
  44816   __ret; \
  44817 })
  44818 #else
  44819 #define vmulxh_laneq_f16(__p0, __p1, __p2) __extension__ ({ \
  44820   float16_t __ret; \
  44821   float16_t __s0 = __p0; \
  44822   float16x8_t __s1 = __p1; \
  44823   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  44824   __ret = (float16_t) __builtin_neon_vmulxh_laneq_f16(__s0, (float16x8_t)__rev1, __p2); \
  44825   __ret; \
  44826 })
  44827 #endif
  44828 
  /* vmulxq_laneq_f16(p0, p1, p2): statement-expression macro that calls
   * vmulxq_f16 on the float16x8_t operand p0 and the value of
   * splatq_laneq_f16(p1, p2), where p1 is a float16x8_t and p2 is passed
   * through textually.
   * Without __LITTLE_ENDIAN__ both vectors are lane-reversed (7..0), the
   * __noswap_ forms of vmulxq_f16 and splatq_laneq_f16 are used, and the
   * result is reversed back.
   * splatq_laneq_f16 and its __noswap_ form are defined outside this excerpt.
   * NOTE(review): the _266/_267 suffixes presumably keep these locals from
   * colliding with locals of the nested splat expansion - confirm. */
  44829 #ifdef __LITTLE_ENDIAN__
  44830 #define vmulxq_laneq_f16(__p0_266, __p1_266, __p2_266) __extension__ ({ \
  44831   float16x8_t __ret_266; \
  44832   float16x8_t __s0_266 = __p0_266; \
  44833   float16x8_t __s1_266 = __p1_266; \
  44834   __ret_266 = vmulxq_f16(__s0_266, splatq_laneq_f16(__s1_266, __p2_266)); \
  44835   __ret_266; \
  44836 })
  44837 #else
  44838 #define vmulxq_laneq_f16(__p0_267, __p1_267, __p2_267) __extension__ ({ \
  44839   float16x8_t __ret_267; \
  44840   float16x8_t __s0_267 = __p0_267; \
  44841   float16x8_t __s1_267 = __p1_267; \
  44842   float16x8_t __rev0_267;  __rev0_267 = __builtin_shufflevector(__s0_267, __s0_267, 7, 6, 5, 4, 3, 2, 1, 0); \
  44843   float16x8_t __rev1_267;  __rev1_267 = __builtin_shufflevector(__s1_267, __s1_267, 7, 6, 5, 4, 3, 2, 1, 0); \
  44844   __ret_267 = __noswap_vmulxq_f16(__rev0_267, __noswap_splatq_laneq_f16(__rev1_267, __p2_267)); \
  44845   __ret_267 = __builtin_shufflevector(__ret_267, __ret_267, 7, 6, 5, 4, 3, 2, 1, 0); \
  44846   __ret_267; \
  44847 })
  44848 #endif
  44849 
  /* vmulx_laneq_f16(v, w, lane): yields vmulx_f16 of the float16x4_t v with the
   * splat_laneq_f16 broadcast of the float16x8_t w at the given lane.
   * The big-endian form lane-reverses both inputs (4 and 8 lanes respectively),
   * uses the __noswap_ helpers, and lane-reverses the 4-lane result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vmulx_laneq_f16(__p0_268, __p1_268, __p2_268) __extension__ ({ \
    float16x4_t __s0_268 = __p0_268; \
    float16x8_t __s1_268 = __p1_268; \
    float16x4_t __ret_268 = vmulx_f16(__s0_268, splat_laneq_f16(__s1_268, __p2_268)); \
    __ret_268; \
  })
  #else
  #define vmulx_laneq_f16(__p0_269, __p1_269, __p2_269) __extension__ ({ \
    float16x4_t __s0_269 = __p0_269; \
    float16x8_t __s1_269 = __p1_269; \
    float16x4_t __rev0_269 = __builtin_shufflevector(__s0_269, __s0_269, 3, 2, 1, 0); \
    float16x8_t __rev1_269 = __builtin_shufflevector(__s1_269, __s1_269, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x4_t __ret_269 = __noswap_vmulx_f16( \
        __rev0_269, __noswap_splat_laneq_f16(__rev1_269, __p2_269)); \
    __ret_269 = __builtin_shufflevector(__ret_269, __ret_269, 3, 2, 1, 0); \
    __ret_269; \
  })
  #endif
  44870 
  /* vmulxq_n_f16(v, s): yields vmulxq_f16 of the float16x8_t v with an 8-lane
   * vector literal whose every lane is the float16_t scalar s.
   * The big-endian form lane-reverses v, calls __noswap_vmulxq_f16, and
   * lane-reverses the result back; the all-equal literal needs no reversal. */
  #ifdef __LITTLE_ENDIAN__
  #define vmulxq_n_f16(__p0, __p1) __extension__ ({ \
    float16x8_t __s0 = __p0; \
    float16_t __s1 = __p1; \
    float16x8_t __ret = vmulxq_f16( \
        __s0, (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}); \
    __ret; \
  })
  #else
  #define vmulxq_n_f16(__p0, __p1) __extension__ ({ \
    float16x8_t __s0 = __p0; \
    float16_t __s1 = __p1; \
    float16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __ret = __noswap_vmulxq_f16( \
        __rev0, (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}); \
    __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  44890 
  /* vmulx_n_f16(v, s): yields vmulx_f16 of the float16x4_t v with a 4-lane
   * vector literal whose every lane is the float16_t scalar s.
   * The big-endian form lane-reverses v, calls __noswap_vmulx_f16, and
   * lane-reverses the result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vmulx_n_f16(__p0, __p1) __extension__ ({ \
    float16x4_t __s0 = __p0; \
    float16_t __s1 = __p1; \
    float16x4_t __ret = vmulx_f16(__s0, (float16x4_t) {__s1, __s1, __s1, __s1}); \
    __ret; \
  })
  #else
  #define vmulx_n_f16(__p0, __p1) __extension__ ({ \
    float16x4_t __s0 = __p0; \
    float16_t __s1 = __p1; \
    float16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    float16x4_t __ret = __noswap_vmulx_f16(__rev0, (float16x4_t) {__s1, __s1, __s1, __s1}); \
    __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  44910 
  44911 #ifdef __LITTLE_ENDIAN__
  44912 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpaddq_f16(float16x8_t __p0, float16x8_t __p1) {
  44913   float16x8_t __ret;
  44914   __ret = (float16x8_t) __builtin_neon_vpaddq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44915   return __ret;
  44916 }
  44917 #else
  44918 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpaddq_f16(float16x8_t __p0, float16x8_t __p1) {
  44919   float16x8_t __ret;
  44920   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44921   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44922   __ret = (float16x8_t) __builtin_neon_vpaddq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  44923   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44924   return __ret;
  44925 }
  44926 #endif
  44927 
  44928 #ifdef __LITTLE_ENDIAN__
  44929 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxq_f16(float16x8_t __p0, float16x8_t __p1) {
  44930   float16x8_t __ret;
  44931   __ret = (float16x8_t) __builtin_neon_vpmaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44932   return __ret;
  44933 }
  44934 #else
  44935 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxq_f16(float16x8_t __p0, float16x8_t __p1) {
  44936   float16x8_t __ret;
  44937   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44938   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44939   __ret = (float16x8_t) __builtin_neon_vpmaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  44940   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44941   return __ret;
  44942 }
  44943 #endif
  44944 
  44945 #ifdef __LITTLE_ENDIAN__
  44946 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  44947   float16x8_t __ret;
  44948   __ret = (float16x8_t) __builtin_neon_vpmaxnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44949   return __ret;
  44950 }
  44951 #else
  44952 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  44953   float16x8_t __ret;
  44954   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44955   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44956   __ret = (float16x8_t) __builtin_neon_vpmaxnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  44957   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44958   return __ret;
  44959 }
  44960 #endif
  44961 
  44962 #ifdef __LITTLE_ENDIAN__
  44963 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmaxnm_f16(float16x4_t __p0, float16x4_t __p1) {
  44964   float16x4_t __ret;
  44965   __ret = (float16x4_t) __builtin_neon_vpmaxnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  44966   return __ret;
  44967 }
  44968 #else
  44969 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmaxnm_f16(float16x4_t __p0, float16x4_t __p1) {
  44970   float16x4_t __ret;
  44971   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  44972   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  44973   __ret = (float16x4_t) __builtin_neon_vpmaxnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  44974   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  44975   return __ret;
  44976 }
  44977 #endif
  44978 
  44979 #ifdef __LITTLE_ENDIAN__
  44980 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminq_f16(float16x8_t __p0, float16x8_t __p1) {
  44981   float16x8_t __ret;
  44982   __ret = (float16x8_t) __builtin_neon_vpminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  44983   return __ret;
  44984 }
  44985 #else
  44986 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminq_f16(float16x8_t __p0, float16x8_t __p1) {
  44987   float16x8_t __ret;
  44988   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  44989   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  44990   __ret = (float16x8_t) __builtin_neon_vpminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  44991   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  44992   return __ret;
  44993 }
  44994 #endif
  44995 
  44996 #ifdef __LITTLE_ENDIAN__
  44997 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  44998   float16x8_t __ret;
  44999   __ret = (float16x8_t) __builtin_neon_vpminnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
  45000   return __ret;
  45001 }
  45002 #else
  45003 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminnmq_f16(float16x8_t __p0, float16x8_t __p1) {
  45004   float16x8_t __ret;
  45005   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45006   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  45007   __ret = (float16x8_t) __builtin_neon_vpminnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40);
  45008   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  45009   return __ret;
  45010 }
  45011 #endif
  45012 
  45013 #ifdef __LITTLE_ENDIAN__
  45014 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpminnm_f16(float16x4_t __p0, float16x4_t __p1) {
  45015   float16x4_t __ret;
  45016   __ret = (float16x4_t) __builtin_neon_vpminnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
  45017   return __ret;
  45018 }
  45019 #else
  45020 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpminnm_f16(float16x4_t __p0, float16x4_t __p1) {
  45021   float16x4_t __ret;
  45022   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45023   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  45024   __ret = (float16x4_t) __builtin_neon_vpminnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8);
  45025   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  45026   return __ret;
  45027 }
  45028 #endif
  45029 
  45030 #ifdef __LITTLE_ENDIAN__
  45031 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndiq_f16(float16x8_t __p0) {
  45032   float16x8_t __ret;
  45033   __ret = (float16x8_t) __builtin_neon_vrndiq_f16((int8x16_t)__p0, 40);
  45034   return __ret;
  45035 }
  45036 #else
  45037 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndiq_f16(float16x8_t __p0) {
  45038   float16x8_t __ret;
  45039   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45040   __ret = (float16x8_t) __builtin_neon_vrndiq_f16((int8x16_t)__rev0, 40);
  45041   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  45042   return __ret;
  45043 }
  45044 #endif
  45045 
  45046 #ifdef __LITTLE_ENDIAN__
  45047 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndi_f16(float16x4_t __p0) {
  45048   float16x4_t __ret;
  45049   __ret = (float16x4_t) __builtin_neon_vrndi_f16((int8x8_t)__p0, 8);
  45050   return __ret;
  45051 }
  45052 #else
  45053 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndi_f16(float16x4_t __p0) {
  45054   float16x4_t __ret;
  45055   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45056   __ret = (float16x4_t) __builtin_neon_vrndi_f16((int8x8_t)__rev0, 8);
  45057   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  45058   return __ret;
  45059 }
  45060 #endif
  45061 
  45062 #ifdef __LITTLE_ENDIAN__
  45063 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsqrtq_f16(float16x8_t __p0) {
  45064   float16x8_t __ret;
  45065   __ret = (float16x8_t) __builtin_neon_vsqrtq_f16((int8x16_t)__p0, 40);
  45066   return __ret;
  45067 }
  45068 #else
  45069 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsqrtq_f16(float16x8_t __p0) {
  45070   float16x8_t __ret;
  45071   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45072   __ret = (float16x8_t) __builtin_neon_vsqrtq_f16((int8x16_t)__rev0, 40);
  45073   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  45074   return __ret;
  45075 }
  45076 #endif
  45077 
  45078 #ifdef __LITTLE_ENDIAN__
  45079 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsqrt_f16(float16x4_t __p0) {
  45080   float16x4_t __ret;
  45081   __ret = (float16x4_t) __builtin_neon_vsqrt_f16((int8x8_t)__p0, 8);
  45082   return __ret;
  45083 }
  45084 #else
  45085 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsqrt_f16(float16x4_t __p0) {
  45086   float16x4_t __ret;
  45087   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45088   __ret = (float16x4_t) __builtin_neon_vsqrt_f16((int8x8_t)__rev0, 8);
  45089   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  45090   return __ret;
  45091 }
  45092 #endif
  45093 
  /* vsudotq_laneq_s32(acc, s, u, lane): expressed through vusdotq_s32 with the
   * operand roles swapped. The uint8x16_t u is bit-cast to int32x4_t, one
   * 32-bit lane is broadcast with splatq_laneq_s32, the broadcast is cast back
   * to uint8x16_t and passed as the second argument; the int8x16_t s goes last.
   * The big-endian form lane-reverses all three vectors, uses the __noswap_
   * helpers, and lane-reverses the int32x4_t result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vsudotq_laneq_s32(__p0_270, __p1_270, __p2_270, __p3_270) __extension__ ({ \
    int32x4_t __s0_270 = __p0_270; \
    int8x16_t __s1_270 = __p1_270; \
    uint8x16_t __s2_270 = __p2_270; \
    int32x4_t __ret_270 = vusdotq_s32( \
        __s0_270, \
        (uint8x16_t)(splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_270), __p3_270)), \
        __s1_270); \
    __ret_270; \
  })
  #else
  #define vsudotq_laneq_s32(__p0_271, __p1_271, __p2_271, __p3_271) __extension__ ({ \
    int32x4_t __s0_271 = __p0_271; \
    int8x16_t __s1_271 = __p1_271; \
    uint8x16_t __s2_271 = __p2_271; \
    int32x4_t __rev0_271 = __builtin_shufflevector(__s0_271, __s0_271, 3, 2, 1, 0); \
    int8x16_t __rev1_271 = __builtin_shufflevector(__s1_271, __s1_271, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint8x16_t __rev2_271 = __builtin_shufflevector(__s2_271, __s2_271, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x4_t __ret_271 = __noswap_vusdotq_s32( \
        __rev0_271, \
        (uint8x16_t)(__noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_271), __p3_271)), \
        __rev1_271); \
    __ret_271 = __builtin_shufflevector(__ret_271, __ret_271, 3, 2, 1, 0); \
    __ret_271; \
  })
  #endif
  45117 
  /* vsudot_laneq_s32(acc, s, u, lane): expressed through vusdot_s32 with the
   * operand roles swapped. The uint8x16_t u is bit-cast to int32x4_t, one
   * 32-bit lane is broadcast with splat_laneq_s32, the broadcast is cast to
   * uint8x8_t and passed as the second argument; the int8x8_t s goes last.
   * The big-endian form lane-reverses all three vectors, uses the __noswap_
   * helpers, and lane-reverses the int32x2_t result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vsudot_laneq_s32(__p0_272, __p1_272, __p2_272, __p3_272) __extension__ ({ \
    int32x2_t __s0_272 = __p0_272; \
    int8x8_t __s1_272 = __p1_272; \
    uint8x16_t __s2_272 = __p2_272; \
    int32x2_t __ret_272 = vusdot_s32( \
        __s0_272, \
        (uint8x8_t)(splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_272), __p3_272)), \
        __s1_272); \
    __ret_272; \
  })
  #else
  #define vsudot_laneq_s32(__p0_273, __p1_273, __p2_273, __p3_273) __extension__ ({ \
    int32x2_t __s0_273 = __p0_273; \
    int8x8_t __s1_273 = __p1_273; \
    uint8x16_t __s2_273 = __p2_273; \
    int32x2_t __rev0_273 = __builtin_shufflevector(__s0_273, __s0_273, 1, 0); \
    int8x8_t __rev1_273 = __builtin_shufflevector(__s1_273, __s1_273, 7, 6, 5, 4, 3, 2, 1, 0); \
    uint8x16_t __rev2_273 = __builtin_shufflevector(__s2_273, __s2_273, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x2_t __ret_273 = __noswap_vusdot_s32( \
        __rev0_273, \
        (uint8x8_t)(__noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_273), __p3_273)), \
        __rev1_273); \
    __ret_273 = __builtin_shufflevector(__ret_273, __ret_273, 1, 0); \
    __ret_273; \
  })
  #endif
  45141 
  /* vusdotq_laneq_s32(acc, u, s, lane): calls vusdotq_s32 with acc, the
   * uint8x16_t u, and a broadcast of s. The int8x16_t s is bit-cast to
   * int32x4_t, one 32-bit lane is broadcast with splatq_laneq_s32, and the
   * broadcast is cast back to int8x16_t.
   * The big-endian form lane-reverses all three vectors, uses the __noswap_
   * helpers, and lane-reverses the int32x4_t result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vusdotq_laneq_s32(__p0_274, __p1_274, __p2_274, __p3_274) __extension__ ({ \
    int32x4_t __s0_274 = __p0_274; \
    uint8x16_t __s1_274 = __p1_274; \
    int8x16_t __s2_274 = __p2_274; \
    int32x4_t __ret_274 = vusdotq_s32( \
        __s0_274, \
        __s1_274, \
        (int8x16_t)(splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_274), __p3_274))); \
    __ret_274; \
  })
  #else
  #define vusdotq_laneq_s32(__p0_275, __p1_275, __p2_275, __p3_275) __extension__ ({ \
    int32x4_t __s0_275 = __p0_275; \
    uint8x16_t __s1_275 = __p1_275; \
    int8x16_t __s2_275 = __p2_275; \
    int32x4_t __rev0_275 = __builtin_shufflevector(__s0_275, __s0_275, 3, 2, 1, 0); \
    uint8x16_t __rev1_275 = __builtin_shufflevector(__s1_275, __s1_275, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __rev2_275 = __builtin_shufflevector(__s2_275, __s2_275, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x4_t __ret_275 = __noswap_vusdotq_s32( \
        __rev0_275, \
        __rev1_275, \
        (int8x16_t)(__noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_275), __p3_275))); \
    __ret_275 = __builtin_shufflevector(__ret_275, __ret_275, 3, 2, 1, 0); \
    __ret_275; \
  })
  #endif
  45165 
  /* vusdot_laneq_s32(acc, u, s, lane): calls vusdot_s32 with acc, the
   * uint8x8_t u, and a broadcast of s. The int8x16_t s is bit-cast to
   * int32x4_t, one 32-bit lane is broadcast with splat_laneq_s32, and the
   * broadcast is cast to int8x8_t.
   * The big-endian form lane-reverses all three vectors, uses the __noswap_
   * helpers, and lane-reverses the int32x2_t result back. */
  #ifdef __LITTLE_ENDIAN__
  #define vusdot_laneq_s32(__p0_276, __p1_276, __p2_276, __p3_276) __extension__ ({ \
    int32x2_t __s0_276 = __p0_276; \
    uint8x8_t __s1_276 = __p1_276; \
    int8x16_t __s2_276 = __p2_276; \
    int32x2_t __ret_276 = vusdot_s32( \
        __s0_276, \
        __s1_276, \
        (int8x8_t)(splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_276), __p3_276))); \
    __ret_276; \
  })
  #else
  #define vusdot_laneq_s32(__p0_277, __p1_277, __p2_277, __p3_277) __extension__ ({ \
    int32x2_t __s0_277 = __p0_277; \
    uint8x8_t __s1_277 = __p1_277; \
    int8x16_t __s2_277 = __p2_277; \
    int32x2_t __rev0_277 = __builtin_shufflevector(__s0_277, __s0_277, 1, 0); \
    uint8x8_t __rev1_277 = __builtin_shufflevector(__s1_277, __s1_277, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __rev2_277 = __builtin_shufflevector(__s2_277, __s2_277, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x2_t __ret_277 = __noswap_vusdot_s32( \
        __rev0_277, \
        __rev1_277, \
        (int8x8_t)(__noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_277), __p3_277))); \
    __ret_277 = __builtin_shufflevector(__ret_277, __ret_277, 1, 0); \
    __ret_277; \
  })
  #endif
  45189 
  45190 #ifdef __LITTLE_ENDIAN__
  45191 __ai __attribute__((target("neon"))) float64x2_t vabdq_f64(float64x2_t __p0, float64x2_t __p1) {
  45192   float64x2_t __ret;
  45193   __ret = (float64x2_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  45194   return __ret;
  45195 }
  45196 #else
  45197 __ai __attribute__((target("neon"))) float64x2_t vabdq_f64(float64x2_t __p0, float64x2_t __p1) {
  45198   float64x2_t __ret;
  45199   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45200   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45201   __ret = (float64x2_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  45202   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45203   return __ret;
  45204 }
  45205 #endif
  45206 
  45207 __ai __attribute__((target("neon"))) float64x1_t vabd_f64(float64x1_t __p0, float64x1_t __p1) {
  45208   float64x1_t __ret;
  45209   __ret = (float64x1_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  45210   return __ret;
  45211 }
  45212 __ai __attribute__((target("neon"))) float64_t vabdd_f64(float64_t __p0, float64_t __p1) {
  45213   float64_t __ret;
  45214   __ret = (float64_t) __builtin_neon_vabdd_f64(__p0, __p1);
  45215   return __ret;
  45216 }
  45217 __ai __attribute__((target("neon"))) float32_t vabds_f32(float32_t __p0, float32_t __p1) {
  45218   float32_t __ret;
  45219   __ret = (float32_t) __builtin_neon_vabds_f32(__p0, __p1);
  45220   return __ret;
  45221 }
  45222 #ifdef __LITTLE_ENDIAN__
  45223 __ai __attribute__((target("neon"))) float64x2_t vabsq_f64(float64x2_t __p0) {
  45224   float64x2_t __ret;
  45225   __ret = (float64x2_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 42);
  45226   return __ret;
  45227 }
  45228 #else
  45229 __ai __attribute__((target("neon"))) float64x2_t vabsq_f64(float64x2_t __p0) {
  45230   float64x2_t __ret;
  45231   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45232   __ret = (float64x2_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 42);
  45233   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45234   return __ret;
  45235 }
  45236 #endif
  45237 
  45238 #ifdef __LITTLE_ENDIAN__
  45239 __ai __attribute__((target("neon"))) int64x2_t vabsq_s64(int64x2_t __p0) {
  45240   int64x2_t __ret;
  45241   __ret = (int64x2_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 35);
  45242   return __ret;
  45243 }
  45244 #else
  45245 __ai __attribute__((target("neon"))) int64x2_t vabsq_s64(int64x2_t __p0) {
  45246   int64x2_t __ret;
  45247   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45248   __ret = (int64x2_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 35);
  45249   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45250   return __ret;
  45251 }
  45252 #endif
  45253 
  45254 __ai __attribute__((target("neon"))) float64x1_t vabs_f64(float64x1_t __p0) {
  45255   float64x1_t __ret;
  45256   __ret = (float64x1_t) __builtin_neon_vabs_v((int8x8_t)__p0, 10);
  45257   return __ret;
  45258 }
  45259 __ai __attribute__((target("neon"))) int64x1_t vabs_s64(int64x1_t __p0) {
  45260   int64x1_t __ret;
  45261   __ret = (int64x1_t) __builtin_neon_vabs_v((int8x8_t)__p0, 3);
  45262   return __ret;
  45263 }
  45264 __ai __attribute__((target("neon"))) int64_t vabsd_s64(int64_t __p0) {
  45265   int64_t __ret;
  45266   __ret = (int64_t) __builtin_neon_vabsd_s64(__p0);
  45267   return __ret;
  45268 }
  45269 #ifdef __LITTLE_ENDIAN__
  45270 __ai __attribute__((target("neon"))) float64x2_t vaddq_f64(float64x2_t __p0, float64x2_t __p1) {
  45271   float64x2_t __ret;
  45272   __ret = __p0 + __p1;
  45273   return __ret;
  45274 }
  45275 #else
  45276 __ai __attribute__((target("neon"))) float64x2_t vaddq_f64(float64x2_t __p0, float64x2_t __p1) {
  45277   float64x2_t __ret;
  45278   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45279   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45280   __ret = __rev0 + __rev1;
  45281   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45282   return __ret;
  45283 }
  45284 #endif
  45285 
  45286 __ai __attribute__((target("neon"))) float64x1_t vadd_f64(float64x1_t __p0, float64x1_t __p1) {
  45287   float64x1_t __ret;
  45288   __ret = __p0 + __p1;
  45289   return __ret;
  45290 }
  45291 __ai __attribute__((target("neon"))) uint64_t vaddd_u64(uint64_t __p0, uint64_t __p1) {
  45292   uint64_t __ret;
  45293   __ret = (uint64_t) __builtin_neon_vaddd_u64(__p0, __p1);
  45294   return __ret;
  45295 }
  45296 __ai __attribute__((target("neon"))) int64_t vaddd_s64(int64_t __p0, int64_t __p1) {
  45297   int64_t __ret;
  45298   __ret = (int64_t) __builtin_neon_vaddd_s64(__p0, __p1);
  45299   return __ret;
  45300 }
  45301 __ai __attribute__((target("neon"))) poly128_t vaddq_p128(poly128_t __p0, poly128_t __p1) {
  45302   poly128_t __ret;
  45303   __ret = (poly128_t) __builtin_neon_vaddq_p128(__p0, __p1);
  45304   return __ret;
  45305 }
  45306 #ifdef __LITTLE_ENDIAN__
  45307 __ai __attribute__((target("neon"))) uint16x8_t vaddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  45308   uint16x8_t __ret;
  45309   __ret = vcombine_u16(__p0, vaddhn_u32(__p1, __p2));
  45310   return __ret;
  45311 }
  45312 #else
  45313 __ai __attribute__((target("neon"))) uint16x8_t vaddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  45314   uint16x8_t __ret;
  45315   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45316   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  45317   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  45318   __ret = __noswap_vcombine_u16(__rev0, __noswap_vaddhn_u32(__rev1, __rev2));
  45319   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  45320   return __ret;
  45321 }
  45322 #endif
  45323 
  45324 #ifdef __LITTLE_ENDIAN__
  45325 __ai __attribute__((target("neon"))) uint32x4_t vaddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  45326   uint32x4_t __ret;
  45327   __ret = vcombine_u32(__p0, vaddhn_u64(__p1, __p2));
  45328   return __ret;
  45329 }
  45330 #else
  45331 __ai __attribute__((target("neon"))) uint32x4_t vaddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  45332   uint32x4_t __ret;
  45333   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45334   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45335   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  45336   __ret = __noswap_vcombine_u32(__rev0, __noswap_vaddhn_u64(__rev1, __rev2));
  45337   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  45338   return __ret;
  45339 }
  45340 #endif
  45341 
  45342 #ifdef __LITTLE_ENDIAN__
  45343 __ai __attribute__((target("neon"))) uint8x16_t vaddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  45344   uint8x16_t __ret;
  45345   __ret = vcombine_u8(__p0, vaddhn_u16(__p1, __p2));
  45346   return __ret;
  45347 }
  45348 #else
  45349 __ai __attribute__((target("neon"))) uint8x16_t vaddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  45350   uint8x16_t __ret;
  45351   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45352   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  45353   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  45354   __ret = __noswap_vcombine_u8(__rev0, __noswap_vaddhn_u16(__rev1, __rev2));
  45355   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45356   return __ret;
  45357 }
  45358 #endif
  45359 
  45360 #ifdef __LITTLE_ENDIAN__
  45361 __ai __attribute__((target("neon"))) int16x8_t vaddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  45362   int16x8_t __ret;
  45363   __ret = vcombine_s16(__p0, vaddhn_s32(__p1, __p2));
  45364   return __ret;
  45365 }
  45366 #else
  45367 __ai __attribute__((target("neon"))) int16x8_t vaddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  45368   int16x8_t __ret;
  45369   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45370   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  45371   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  45372   __ret = __noswap_vcombine_s16(__rev0, __noswap_vaddhn_s32(__rev1, __rev2));
  45373   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  45374   return __ret;
  45375 }
  45376 #endif
  45377 
  45378 #ifdef __LITTLE_ENDIAN__
  45379 __ai __attribute__((target("neon"))) int32x4_t vaddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  45380   int32x4_t __ret;
  45381   __ret = vcombine_s32(__p0, vaddhn_s64(__p1, __p2));
  45382   return __ret;
  45383 }
  45384 #else
  45385 __ai __attribute__((target("neon"))) int32x4_t vaddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  45386   int32x4_t __ret;
  45387   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45388   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45389   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  45390   __ret = __noswap_vcombine_s32(__rev0, __noswap_vaddhn_s64(__rev1, __rev2));
  45391   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  45392   return __ret;
  45393 }
  45394 #endif
  45395 
  45396 #ifdef __LITTLE_ENDIAN__
  45397 __ai __attribute__((target("neon"))) int8x16_t vaddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  45398   int8x16_t __ret;
  45399   __ret = vcombine_s8(__p0, vaddhn_s16(__p1, __p2));
  45400   return __ret;
  45401 }
  45402 #else
  45403 __ai __attribute__((target("neon"))) int8x16_t vaddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  45404   int8x16_t __ret;
  45405   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45406   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  45407   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  45408   __ret = __noswap_vcombine_s8(__rev0, __noswap_vaddhn_s16(__rev1, __rev2));
  45409   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45410   return __ret;
  45411 }
  45412 #endif
  45413 
  45414 #ifdef __LITTLE_ENDIAN__
  45415 __ai __attribute__((target("neon"))) uint16_t vaddlvq_u8(uint8x16_t __p0) {
  45416   uint16_t __ret;
  45417   __ret = (uint16_t) __builtin_neon_vaddlvq_u8(__p0);
  45418   return __ret;
  45419 }
  45420 #else
  45421 __ai __attribute__((target("neon"))) uint16_t vaddlvq_u8(uint8x16_t __p0) {
  45422   uint16_t __ret;
  45423   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45424   __ret = (uint16_t) __builtin_neon_vaddlvq_u8(__rev0);
  45425   return __ret;
  45426 }
  45427 #endif
  45428 
  45429 #ifdef __LITTLE_ENDIAN__
  45430 __ai __attribute__((target("neon"))) uint64_t vaddlvq_u32(uint32x4_t __p0) {
  45431   uint64_t __ret;
  45432   __ret = (uint64_t) __builtin_neon_vaddlvq_u32(__p0);
  45433   return __ret;
  45434 }
  45435 #else
  45436 __ai __attribute__((target("neon"))) uint64_t vaddlvq_u32(uint32x4_t __p0) {
  45437   uint64_t __ret;
  45438   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45439   __ret = (uint64_t) __builtin_neon_vaddlvq_u32(__rev0);
  45440   return __ret;
  45441 }
  45442 #endif
  45443 
  45444 #ifdef __LITTLE_ENDIAN__
  45445 __ai __attribute__((target("neon"))) uint32_t vaddlvq_u16(uint16x8_t __p0) {
  45446   uint32_t __ret;
  45447   __ret = (uint32_t) __builtin_neon_vaddlvq_u16(__p0);
  45448   return __ret;
  45449 }
  45450 #else
  45451 __ai __attribute__((target("neon"))) uint32_t vaddlvq_u16(uint16x8_t __p0) {
  45452   uint32_t __ret;
  45453   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45454   __ret = (uint32_t) __builtin_neon_vaddlvq_u16(__rev0);
  45455   return __ret;
  45456 }
  45457 #endif
  45458 
  45459 #ifdef __LITTLE_ENDIAN__
  45460 __ai __attribute__((target("neon"))) int16_t vaddlvq_s8(int8x16_t __p0) {
  45461   int16_t __ret;
  45462   __ret = (int16_t) __builtin_neon_vaddlvq_s8(__p0);
  45463   return __ret;
  45464 }
  45465 #else
  45466 __ai __attribute__((target("neon"))) int16_t vaddlvq_s8(int8x16_t __p0) {
  45467   int16_t __ret;
  45468   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45469   __ret = (int16_t) __builtin_neon_vaddlvq_s8(__rev0);
  45470   return __ret;
  45471 }
  45472 #endif
  45473 
  45474 #ifdef __LITTLE_ENDIAN__
  45475 __ai __attribute__((target("neon"))) int64_t vaddlvq_s32(int32x4_t __p0) {
  45476   int64_t __ret;
  45477   __ret = (int64_t) __builtin_neon_vaddlvq_s32(__p0);
  45478   return __ret;
  45479 }
  45480 #else
  45481 __ai __attribute__((target("neon"))) int64_t vaddlvq_s32(int32x4_t __p0) {
  45482   int64_t __ret;
  45483   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45484   __ret = (int64_t) __builtin_neon_vaddlvq_s32(__rev0);
  45485   return __ret;
  45486 }
  45487 #endif
  45488 
  45489 #ifdef __LITTLE_ENDIAN__
  45490 __ai __attribute__((target("neon"))) int32_t vaddlvq_s16(int16x8_t __p0) {
  45491   int32_t __ret;
  45492   __ret = (int32_t) __builtin_neon_vaddlvq_s16(__p0);
  45493   return __ret;
  45494 }
  45495 #else
  45496 __ai __attribute__((target("neon"))) int32_t vaddlvq_s16(int16x8_t __p0) {
  45497   int32_t __ret;
  45498   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45499   __ret = (int32_t) __builtin_neon_vaddlvq_s16(__rev0);
  45500   return __ret;
  45501 }
  45502 #endif
  45503 
  45504 #ifdef __LITTLE_ENDIAN__
  45505 __ai __attribute__((target("neon"))) uint16_t vaddlv_u8(uint8x8_t __p0) {
  45506   uint16_t __ret;
  45507   __ret = (uint16_t) __builtin_neon_vaddlv_u8(__p0);
  45508   return __ret;
  45509 }
  45510 #else
  45511 __ai __attribute__((target("neon"))) uint16_t vaddlv_u8(uint8x8_t __p0) {
  45512   uint16_t __ret;
  45513   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45514   __ret = (uint16_t) __builtin_neon_vaddlv_u8(__rev0);
  45515   return __ret;
  45516 }
  45517 #endif
  45518 
  45519 #ifdef __LITTLE_ENDIAN__
  45520 __ai __attribute__((target("neon"))) uint64_t vaddlv_u32(uint32x2_t __p0) {
  45521   uint64_t __ret;
  45522   __ret = (uint64_t) __builtin_neon_vaddlv_u32(__p0);
  45523   return __ret;
  45524 }
  45525 #else
  45526 __ai __attribute__((target("neon"))) uint64_t vaddlv_u32(uint32x2_t __p0) {
  45527   uint64_t __ret;
  45528   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45529   __ret = (uint64_t) __builtin_neon_vaddlv_u32(__rev0);
  45530   return __ret;
  45531 }
  45532 #endif
  45533 
  45534 #ifdef __LITTLE_ENDIAN__
  45535 __ai __attribute__((target("neon"))) uint32_t vaddlv_u16(uint16x4_t __p0) {
  45536   uint32_t __ret;
  45537   __ret = (uint32_t) __builtin_neon_vaddlv_u16(__p0);
  45538   return __ret;
  45539 }
  45540 #else
  45541 __ai __attribute__((target("neon"))) uint32_t vaddlv_u16(uint16x4_t __p0) {
  45542   uint32_t __ret;
  45543   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45544   __ret = (uint32_t) __builtin_neon_vaddlv_u16(__rev0);
  45545   return __ret;
  45546 }
  45547 #endif
  45548 
  45549 #ifdef __LITTLE_ENDIAN__
  45550 __ai __attribute__((target("neon"))) int16_t vaddlv_s8(int8x8_t __p0) {
  45551   int16_t __ret;
  45552   __ret = (int16_t) __builtin_neon_vaddlv_s8(__p0);
  45553   return __ret;
  45554 }
  45555 #else
  45556 __ai __attribute__((target("neon"))) int16_t vaddlv_s8(int8x8_t __p0) {
  45557   int16_t __ret;
  45558   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45559   __ret = (int16_t) __builtin_neon_vaddlv_s8(__rev0);
  45560   return __ret;
  45561 }
  45562 #endif
  45563 
  45564 #ifdef __LITTLE_ENDIAN__
  45565 __ai __attribute__((target("neon"))) int64_t vaddlv_s32(int32x2_t __p0) {
  45566   int64_t __ret;
  45567   __ret = (int64_t) __builtin_neon_vaddlv_s32(__p0);
  45568   return __ret;
  45569 }
  45570 #else
  45571 __ai __attribute__((target("neon"))) int64_t vaddlv_s32(int32x2_t __p0) {
  45572   int64_t __ret;
  45573   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45574   __ret = (int64_t) __builtin_neon_vaddlv_s32(__rev0);
  45575   return __ret;
  45576 }
  45577 #endif
  45578 
  45579 #ifdef __LITTLE_ENDIAN__
  45580 __ai __attribute__((target("neon"))) int32_t vaddlv_s16(int16x4_t __p0) {
  45581   int32_t __ret;
  45582   __ret = (int32_t) __builtin_neon_vaddlv_s16(__p0);
  45583   return __ret;
  45584 }
  45585 #else
  45586 __ai __attribute__((target("neon"))) int32_t vaddlv_s16(int16x4_t __p0) {
  45587   int32_t __ret;
  45588   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45589   __ret = (int32_t) __builtin_neon_vaddlv_s16(__rev0);
  45590   return __ret;
  45591 }
  45592 #endif
  45593 
  45594 #ifdef __LITTLE_ENDIAN__
  45595 __ai __attribute__((target("neon"))) uint8_t vaddvq_u8(uint8x16_t __p0) {
  45596   uint8_t __ret;
  45597   __ret = (uint8_t) __builtin_neon_vaddvq_u8(__p0);
  45598   return __ret;
  45599 }
  45600 #else
  45601 __ai __attribute__((target("neon"))) uint8_t vaddvq_u8(uint8x16_t __p0) {
  45602   uint8_t __ret;
  45603   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45604   __ret = (uint8_t) __builtin_neon_vaddvq_u8(__rev0);
  45605   return __ret;
  45606 }
  45607 #endif
  45608 
  45609 #ifdef __LITTLE_ENDIAN__
  45610 __ai __attribute__((target("neon"))) uint32_t vaddvq_u32(uint32x4_t __p0) {
  45611   uint32_t __ret;
  45612   __ret = (uint32_t) __builtin_neon_vaddvq_u32(__p0);
  45613   return __ret;
  45614 }
  45615 #else
  45616 __ai __attribute__((target("neon"))) uint32_t vaddvq_u32(uint32x4_t __p0) {
  45617   uint32_t __ret;
  45618   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45619   __ret = (uint32_t) __builtin_neon_vaddvq_u32(__rev0);
  45620   return __ret;
  45621 }
  45622 #endif
  45623 
  45624 #ifdef __LITTLE_ENDIAN__
  45625 __ai __attribute__((target("neon"))) uint64_t vaddvq_u64(uint64x2_t __p0) {
  45626   uint64_t __ret;
  45627   __ret = (uint64_t) __builtin_neon_vaddvq_u64(__p0);
  45628   return __ret;
  45629 }
  45630 #else
  45631 __ai __attribute__((target("neon"))) uint64_t vaddvq_u64(uint64x2_t __p0) {
  45632   uint64_t __ret;
  45633   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45634   __ret = (uint64_t) __builtin_neon_vaddvq_u64(__rev0);
  45635   return __ret;
  45636 }
  45637 #endif
  45638 
  45639 #ifdef __LITTLE_ENDIAN__
  45640 __ai __attribute__((target("neon"))) uint16_t vaddvq_u16(uint16x8_t __p0) {
  45641   uint16_t __ret;
  45642   __ret = (uint16_t) __builtin_neon_vaddvq_u16(__p0);
  45643   return __ret;
  45644 }
  45645 #else
  45646 __ai __attribute__((target("neon"))) uint16_t vaddvq_u16(uint16x8_t __p0) {
  45647   uint16_t __ret;
  45648   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45649   __ret = (uint16_t) __builtin_neon_vaddvq_u16(__rev0);
  45650   return __ret;
  45651 }
  45652 #endif
  45653 
  45654 #ifdef __LITTLE_ENDIAN__
  45655 __ai __attribute__((target("neon"))) int8_t vaddvq_s8(int8x16_t __p0) {
  45656   int8_t __ret;
  45657   __ret = (int8_t) __builtin_neon_vaddvq_s8(__p0);
  45658   return __ret;
  45659 }
  45660 #else
  45661 __ai __attribute__((target("neon"))) int8_t vaddvq_s8(int8x16_t __p0) {
  45662   int8_t __ret;
  45663   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  45664   __ret = (int8_t) __builtin_neon_vaddvq_s8(__rev0);
  45665   return __ret;
  45666 }
  45667 #endif
  45668 
  45669 #ifdef __LITTLE_ENDIAN__
  45670 __ai __attribute__((target("neon"))) float64_t vaddvq_f64(float64x2_t __p0) {
  45671   float64_t __ret;
  45672   __ret = (float64_t) __builtin_neon_vaddvq_f64(__p0);
  45673   return __ret;
  45674 }
  45675 #else
  45676 __ai __attribute__((target("neon"))) float64_t vaddvq_f64(float64x2_t __p0) {
  45677   float64_t __ret;
  45678   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45679   __ret = (float64_t) __builtin_neon_vaddvq_f64(__rev0);
  45680   return __ret;
  45681 }
  45682 #endif
  45683 
  45684 #ifdef __LITTLE_ENDIAN__
  45685 __ai __attribute__((target("neon"))) float32_t vaddvq_f32(float32x4_t __p0) {
  45686   float32_t __ret;
  45687   __ret = (float32_t) __builtin_neon_vaddvq_f32(__p0);
  45688   return __ret;
  45689 }
  45690 #else
  45691 __ai __attribute__((target("neon"))) float32_t vaddvq_f32(float32x4_t __p0) {
  45692   float32_t __ret;
  45693   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45694   __ret = (float32_t) __builtin_neon_vaddvq_f32(__rev0);
  45695   return __ret;
  45696 }
  45697 #endif
  45698 
  45699 #ifdef __LITTLE_ENDIAN__
  45700 __ai __attribute__((target("neon"))) int32_t vaddvq_s32(int32x4_t __p0) {
  45701   int32_t __ret;
  45702   __ret = (int32_t) __builtin_neon_vaddvq_s32(__p0);
  45703   return __ret;
  45704 }
  45705 #else
  45706 __ai __attribute__((target("neon"))) int32_t vaddvq_s32(int32x4_t __p0) {
  45707   int32_t __ret;
  45708   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45709   __ret = (int32_t) __builtin_neon_vaddvq_s32(__rev0);
  45710   return __ret;
  45711 }
  45712 #endif
  45713 
  45714 #ifdef __LITTLE_ENDIAN__
  45715 __ai __attribute__((target("neon"))) int64_t vaddvq_s64(int64x2_t __p0) {
  45716   int64_t __ret;
  45717   __ret = (int64_t) __builtin_neon_vaddvq_s64(__p0);
  45718   return __ret;
  45719 }
  45720 #else
  45721 __ai __attribute__((target("neon"))) int64_t vaddvq_s64(int64x2_t __p0) {
  45722   int64_t __ret;
  45723   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45724   __ret = (int64_t) __builtin_neon_vaddvq_s64(__rev0);
  45725   return __ret;
  45726 }
  45727 #endif
  45728 
  45729 #ifdef __LITTLE_ENDIAN__
  45730 __ai __attribute__((target("neon"))) int16_t vaddvq_s16(int16x8_t __p0) {
  45731   int16_t __ret;
  45732   __ret = (int16_t) __builtin_neon_vaddvq_s16(__p0);
  45733   return __ret;
  45734 }
  45735 #else
  45736 __ai __attribute__((target("neon"))) int16_t vaddvq_s16(int16x8_t __p0) {
  45737   int16_t __ret;
  45738   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45739   __ret = (int16_t) __builtin_neon_vaddvq_s16(__rev0);
  45740   return __ret;
  45741 }
  45742 #endif
  45743 
  45744 #ifdef __LITTLE_ENDIAN__
  45745 __ai __attribute__((target("neon"))) uint8_t vaddv_u8(uint8x8_t __p0) {
  45746   uint8_t __ret;
  45747   __ret = (uint8_t) __builtin_neon_vaddv_u8(__p0);
  45748   return __ret;
  45749 }
  45750 #else
  45751 __ai __attribute__((target("neon"))) uint8_t vaddv_u8(uint8x8_t __p0) {
  45752   uint8_t __ret;
  45753   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45754   __ret = (uint8_t) __builtin_neon_vaddv_u8(__rev0);
  45755   return __ret;
  45756 }
  45757 #endif
  45758 
  45759 #ifdef __LITTLE_ENDIAN__
  45760 __ai __attribute__((target("neon"))) uint32_t vaddv_u32(uint32x2_t __p0) {
  45761   uint32_t __ret;
  45762   __ret = (uint32_t) __builtin_neon_vaddv_u32(__p0);
  45763   return __ret;
  45764 }
  45765 #else
  45766 __ai __attribute__((target("neon"))) uint32_t vaddv_u32(uint32x2_t __p0) {
  45767   uint32_t __ret;
  45768   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45769   __ret = (uint32_t) __builtin_neon_vaddv_u32(__rev0);
  45770   return __ret;
  45771 }
  45772 #endif
  45773 
  45774 #ifdef __LITTLE_ENDIAN__
  45775 __ai __attribute__((target("neon"))) uint16_t vaddv_u16(uint16x4_t __p0) {
  45776   uint16_t __ret;
  45777   __ret = (uint16_t) __builtin_neon_vaddv_u16(__p0);
  45778   return __ret;
  45779 }
  45780 #else
  45781 __ai __attribute__((target("neon"))) uint16_t vaddv_u16(uint16x4_t __p0) {
  45782   uint16_t __ret;
  45783   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45784   __ret = (uint16_t) __builtin_neon_vaddv_u16(__rev0);
  45785   return __ret;
  45786 }
  45787 #endif
  45788 
  45789 #ifdef __LITTLE_ENDIAN__
  45790 __ai __attribute__((target("neon"))) int8_t vaddv_s8(int8x8_t __p0) {
  45791   int8_t __ret;
  45792   __ret = (int8_t) __builtin_neon_vaddv_s8(__p0);
  45793   return __ret;
  45794 }
  45795 #else
  45796 __ai __attribute__((target("neon"))) int8_t vaddv_s8(int8x8_t __p0) {
  45797   int8_t __ret;
  45798   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  45799   __ret = (int8_t) __builtin_neon_vaddv_s8(__rev0);
  45800   return __ret;
  45801 }
  45802 #endif
  45803 
  45804 #ifdef __LITTLE_ENDIAN__
  45805 __ai __attribute__((target("neon"))) float32_t vaddv_f32(float32x2_t __p0) {
  45806   float32_t __ret;
  45807   __ret = (float32_t) __builtin_neon_vaddv_f32(__p0);
  45808   return __ret;
  45809 }
  45810 #else
  45811 __ai __attribute__((target("neon"))) float32_t vaddv_f32(float32x2_t __p0) {
  45812   float32_t __ret;
  45813   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45814   __ret = (float32_t) __builtin_neon_vaddv_f32(__rev0);
  45815   return __ret;
  45816 }
  45817 #endif
  45818 
  45819 #ifdef __LITTLE_ENDIAN__
  45820 __ai __attribute__((target("neon"))) int32_t vaddv_s32(int32x2_t __p0) {
  45821   int32_t __ret;
  45822   __ret = (int32_t) __builtin_neon_vaddv_s32(__p0);
  45823   return __ret;
  45824 }
  45825 #else
  45826 __ai __attribute__((target("neon"))) int32_t vaddv_s32(int32x2_t __p0) {
  45827   int32_t __ret;
  45828   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45829   __ret = (int32_t) __builtin_neon_vaddv_s32(__rev0);
  45830   return __ret;
  45831 }
  45832 #endif
  45833 
  45834 #ifdef __LITTLE_ENDIAN__
  45835 __ai __attribute__((target("neon"))) int16_t vaddv_s16(int16x4_t __p0) {
  45836   int16_t __ret;
  45837   __ret = (int16_t) __builtin_neon_vaddv_s16(__p0);
  45838   return __ret;
  45839 }
  45840 #else
  45841 __ai __attribute__((target("neon"))) int16_t vaddv_s16(int16x4_t __p0) {
  45842   int16_t __ret;
  45843   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  45844   __ret = (int16_t) __builtin_neon_vaddv_s16(__rev0);
  45845   return __ret;
  45846 }
  45847 #endif
  45848 
  45849 __ai __attribute__((target("neon"))) poly64x1_t vbsl_p64(uint64x1_t __p0, poly64x1_t __p1, poly64x1_t __p2) {
  45850   poly64x1_t __ret;
  45851   __ret = (poly64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 6);
  45852   return __ret;
  45853 }
  45854 #ifdef __LITTLE_ENDIAN__
  45855 __ai __attribute__((target("neon"))) poly64x2_t vbslq_p64(uint64x2_t __p0, poly64x2_t __p1, poly64x2_t __p2) {
  45856   poly64x2_t __ret;
  45857   __ret = (poly64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 38);
  45858   return __ret;
  45859 }
  45860 #else
  45861 __ai __attribute__((target("neon"))) poly64x2_t vbslq_p64(uint64x2_t __p0, poly64x2_t __p1, poly64x2_t __p2) {
  45862   poly64x2_t __ret;
  45863   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45864   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45865   poly64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  45866   __ret = (poly64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 38);
  45867   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45868   return __ret;
  45869 }
  45870 #endif
  45871 
  45872 #ifdef __LITTLE_ENDIAN__
  45873 __ai __attribute__((target("neon"))) float64x2_t vbslq_f64(uint64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  45874   float64x2_t __ret;
  45875   __ret = (float64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  45876   return __ret;
  45877 }
  45878 #else
  45879 __ai __attribute__((target("neon"))) float64x2_t vbslq_f64(uint64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  45880   float64x2_t __ret;
  45881   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45882   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45883   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  45884   __ret = (float64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  45885   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45886   return __ret;
  45887 }
  45888 #endif
  45889 
  45890 __ai __attribute__((target("neon"))) float64x1_t vbsl_f64(uint64x1_t __p0, float64x1_t __p1, float64x1_t __p2) {
  45891   float64x1_t __ret;
  45892   __ret = (float64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 10);
  45893   return __ret;
  45894 }
  45895 #ifdef __LITTLE_ENDIAN__
  45896 __ai __attribute__((target("neon"))) uint64x2_t vcageq_f64(float64x2_t __p0, float64x2_t __p1) {
  45897   uint64x2_t __ret;
  45898   __ret = (uint64x2_t) __builtin_neon_vcageq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  45899   return __ret;
  45900 }
  45901 #else
  45902 __ai __attribute__((target("neon"))) uint64x2_t vcageq_f64(float64x2_t __p0, float64x2_t __p1) {
  45903   uint64x2_t __ret;
  45904   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45905   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45906   __ret = (uint64x2_t) __builtin_neon_vcageq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  45907   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45908   return __ret;
  45909 }
  45910 #endif
  45911 
  45912 __ai __attribute__((target("neon"))) uint64x1_t vcage_f64(float64x1_t __p0, float64x1_t __p1) {
  45913   uint64x1_t __ret;
  45914   __ret = (uint64x1_t) __builtin_neon_vcage_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  45915   return __ret;
  45916 }
  45917 __ai __attribute__((target("neon"))) uint64_t vcaged_f64(float64_t __p0, float64_t __p1) {
  45918   uint64_t __ret;
  45919   __ret = (uint64_t) __builtin_neon_vcaged_f64(__p0, __p1);
  45920   return __ret;
  45921 }
  45922 __ai __attribute__((target("neon"))) uint32_t vcages_f32(float32_t __p0, float32_t __p1) {
  45923   uint32_t __ret;
  45924   __ret = (uint32_t) __builtin_neon_vcages_f32(__p0, __p1);
  45925   return __ret;
  45926 }
  45927 #ifdef __LITTLE_ENDIAN__
  45928 __ai __attribute__((target("neon"))) uint64x2_t vcagtq_f64(float64x2_t __p0, float64x2_t __p1) {
  45929   uint64x2_t __ret;
  45930   __ret = (uint64x2_t) __builtin_neon_vcagtq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  45931   return __ret;
  45932 }
  45933 #else
  45934 __ai __attribute__((target("neon"))) uint64x2_t vcagtq_f64(float64x2_t __p0, float64x2_t __p1) {
  45935   uint64x2_t __ret;
  45936   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45937   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45938   __ret = (uint64x2_t) __builtin_neon_vcagtq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  45939   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45940   return __ret;
  45941 }
  45942 #endif
  45943 
  45944 __ai __attribute__((target("neon"))) uint64x1_t vcagt_f64(float64x1_t __p0, float64x1_t __p1) {
  45945   uint64x1_t __ret;
  45946   __ret = (uint64x1_t) __builtin_neon_vcagt_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  45947   return __ret;
  45948 }
  45949 __ai __attribute__((target("neon"))) uint64_t vcagtd_f64(float64_t __p0, float64_t __p1) {
  45950   uint64_t __ret;
  45951   __ret = (uint64_t) __builtin_neon_vcagtd_f64(__p0, __p1);
  45952   return __ret;
  45953 }
  45954 __ai __attribute__((target("neon"))) uint32_t vcagts_f32(float32_t __p0, float32_t __p1) {
  45955   uint32_t __ret;
  45956   __ret = (uint32_t) __builtin_neon_vcagts_f32(__p0, __p1);
  45957   return __ret;
  45958 }
  45959 #ifdef __LITTLE_ENDIAN__
  45960 __ai __attribute__((target("neon"))) uint64x2_t vcaleq_f64(float64x2_t __p0, float64x2_t __p1) {
  45961   uint64x2_t __ret;
  45962   __ret = (uint64x2_t) __builtin_neon_vcaleq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  45963   return __ret;
  45964 }
  45965 #else
  45966 __ai __attribute__((target("neon"))) uint64x2_t vcaleq_f64(float64x2_t __p0, float64x2_t __p1) {
  45967   uint64x2_t __ret;
  45968   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  45969   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  45970   __ret = (uint64x2_t) __builtin_neon_vcaleq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  45971   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  45972   return __ret;
  45973 }
  45974 #endif
  45975 
  45976 __ai __attribute__((target("neon"))) uint64x1_t vcale_f64(float64x1_t __p0, float64x1_t __p1) {
  45977   uint64x1_t __ret;
  45978   __ret = (uint64x1_t) __builtin_neon_vcale_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  45979   return __ret;
  45980 }
  45981 __ai __attribute__((target("neon"))) uint64_t vcaled_f64(float64_t __p0, float64_t __p1) {
  45982   uint64_t __ret;
  45983   __ret = (uint64_t) __builtin_neon_vcaled_f64(__p0, __p1);
  45984   return __ret;
  45985 }
  45986 __ai __attribute__((target("neon"))) uint32_t vcales_f32(float32_t __p0, float32_t __p1) {
  45987   uint32_t __ret;
  45988   __ret = (uint32_t) __builtin_neon_vcales_f32(__p0, __p1);
  45989   return __ret;
  45990 }
  45991 #ifdef __LITTLE_ENDIAN__
  45992 __ai __attribute__((target("neon"))) uint64x2_t vcaltq_f64(float64x2_t __p0, float64x2_t __p1) {
  45993   uint64x2_t __ret;
  45994   __ret = (uint64x2_t) __builtin_neon_vcaltq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  45995   return __ret;
  45996 }
  45997 #else
  45998 __ai __attribute__((target("neon"))) uint64x2_t vcaltq_f64(float64x2_t __p0, float64x2_t __p1) {
  45999   uint64x2_t __ret;
  46000   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46001   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46002   __ret = (uint64x2_t) __builtin_neon_vcaltq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  46003   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46004   return __ret;
  46005 }
  46006 #endif
  46007 
  46008 __ai __attribute__((target("neon"))) uint64x1_t vcalt_f64(float64x1_t __p0, float64x1_t __p1) {
  46009   uint64x1_t __ret;
  46010   __ret = (uint64x1_t) __builtin_neon_vcalt_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  46011   return __ret;
  46012 }
  46013 __ai __attribute__((target("neon"))) uint64_t vcaltd_f64(float64_t __p0, float64_t __p1) {
  46014   uint64_t __ret;
  46015   __ret = (uint64_t) __builtin_neon_vcaltd_f64(__p0, __p1);
  46016   return __ret;
  46017 }
  46018 __ai __attribute__((target("neon"))) uint32_t vcalts_f32(float32_t __p0, float32_t __p1) {
  46019   uint32_t __ret;
  46020   __ret = (uint32_t) __builtin_neon_vcalts_f32(__p0, __p1);
  46021   return __ret;
  46022 }
  46023 __ai __attribute__((target("neon"))) uint64x1_t vceq_p64(poly64x1_t __p0, poly64x1_t __p1) {
  46024   uint64x1_t __ret;
  46025   __ret = (uint64x1_t)(__p0 == __p1);
  46026   return __ret;
  46027 }
  46028 #ifdef __LITTLE_ENDIAN__
  46029 __ai __attribute__((target("neon"))) uint64x2_t vceqq_p64(poly64x2_t __p0, poly64x2_t __p1) {
  46030   uint64x2_t __ret;
  46031   __ret = (uint64x2_t)(__p0 == __p1);
  46032   return __ret;
  46033 }
  46034 #else
  46035 __ai __attribute__((target("neon"))) uint64x2_t vceqq_p64(poly64x2_t __p0, poly64x2_t __p1) {
  46036   uint64x2_t __ret;
  46037   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46038   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46039   __ret = (uint64x2_t)(__rev0 == __rev1);
  46040   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46041   return __ret;
  46042 }
  46043 #endif
  46044 
  46045 #ifdef __LITTLE_ENDIAN__
  46046 __ai __attribute__((target("neon"))) uint64x2_t vceqq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46047   uint64x2_t __ret;
  46048   __ret = (uint64x2_t)(__p0 == __p1);
  46049   return __ret;
  46050 }
  46051 #else
  46052 __ai __attribute__((target("neon"))) uint64x2_t vceqq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46053   uint64x2_t __ret;
  46054   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46055   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46056   __ret = (uint64x2_t)(__rev0 == __rev1);
  46057   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46058   return __ret;
  46059 }
  46060 #endif
  46061 
  46062 #ifdef __LITTLE_ENDIAN__
  46063 __ai __attribute__((target("neon"))) uint64x2_t vceqq_f64(float64x2_t __p0, float64x2_t __p1) {
  46064   uint64x2_t __ret;
  46065   __ret = (uint64x2_t)(__p0 == __p1);
  46066   return __ret;
  46067 }
  46068 #else
  46069 __ai __attribute__((target("neon"))) uint64x2_t vceqq_f64(float64x2_t __p0, float64x2_t __p1) {
  46070   uint64x2_t __ret;
  46071   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46072   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46073   __ret = (uint64x2_t)(__rev0 == __rev1);
  46074   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46075   return __ret;
  46076 }
  46077 #endif
  46078 
  46079 #ifdef __LITTLE_ENDIAN__
  46080 __ai __attribute__((target("neon"))) uint64x2_t vceqq_s64(int64x2_t __p0, int64x2_t __p1) {
  46081   uint64x2_t __ret;
  46082   __ret = (uint64x2_t)(__p0 == __p1);
  46083   return __ret;
  46084 }
  46085 #else
  46086 __ai __attribute__((target("neon"))) uint64x2_t vceqq_s64(int64x2_t __p0, int64x2_t __p1) {
  46087   uint64x2_t __ret;
  46088   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46089   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46090   __ret = (uint64x2_t)(__rev0 == __rev1);
  46091   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46092   return __ret;
  46093 }
  46094 #endif
  46095 
  46096 __ai __attribute__((target("neon"))) uint64x1_t vceq_u64(uint64x1_t __p0, uint64x1_t __p1) {
  46097   uint64x1_t __ret;
  46098   __ret = (uint64x1_t)(__p0 == __p1);
  46099   return __ret;
  46100 }
  46101 __ai __attribute__((target("neon"))) uint64x1_t vceq_f64(float64x1_t __p0, float64x1_t __p1) {
  46102   uint64x1_t __ret;
  46103   __ret = (uint64x1_t)(__p0 == __p1);
  46104   return __ret;
  46105 }
  46106 __ai __attribute__((target("neon"))) uint64x1_t vceq_s64(int64x1_t __p0, int64x1_t __p1) {
  46107   uint64x1_t __ret;
  46108   __ret = (uint64x1_t)(__p0 == __p1);
  46109   return __ret;
  46110 }
  46111 __ai __attribute__((target("neon"))) uint64_t vceqd_u64(uint64_t __p0, uint64_t __p1) {
  46112   uint64_t __ret;
  46113   __ret = (uint64_t) __builtin_neon_vceqd_u64(__p0, __p1);
  46114   return __ret;
  46115 }
  46116 __ai __attribute__((target("neon"))) uint64_t vceqd_s64(int64_t __p0, int64_t __p1) {
  46117   uint64_t __ret;
  46118   __ret = (uint64_t) __builtin_neon_vceqd_s64(__p0, __p1);
  46119   return __ret;
  46120 }
  46121 __ai __attribute__((target("neon"))) uint64_t vceqd_f64(float64_t __p0, float64_t __p1) {
  46122   uint64_t __ret;
  46123   __ret = (uint64_t) __builtin_neon_vceqd_f64(__p0, __p1);
  46124   return __ret;
  46125 }
  46126 __ai __attribute__((target("neon"))) uint32_t vceqs_f32(float32_t __p0, float32_t __p1) {
  46127   uint32_t __ret;
  46128   __ret = (uint32_t) __builtin_neon_vceqs_f32(__p0, __p1);
  46129   return __ret;
  46130 }
  46131 #ifdef __LITTLE_ENDIAN__
  46132 __ai __attribute__((target("neon"))) uint8x8_t vceqz_p8(poly8x8_t __p0) {
  46133   uint8x8_t __ret;
  46134   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16);
  46135   return __ret;
  46136 }
  46137 #else
  46138 __ai __attribute__((target("neon"))) uint8x8_t vceqz_p8(poly8x8_t __p0) {
  46139   uint8x8_t __ret;
  46140   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46141   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16);
  46142   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46143   return __ret;
  46144 }
  46145 #endif
  46146 
  46147 __ai __attribute__((target("neon"))) uint64x1_t vceqz_p64(poly64x1_t __p0) {
  46148   uint64x1_t __ret;
  46149   __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19);
  46150   return __ret;
  46151 }
  46152 #ifdef __LITTLE_ENDIAN__
  46153 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_p8(poly8x16_t __p0) {
  46154   uint8x16_t __ret;
  46155   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48);
  46156   return __ret;
  46157 }
  46158 #else
  46159 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_p8(poly8x16_t __p0) {
  46160   uint8x16_t __ret;
  46161   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46162   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48);
  46163   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46164   return __ret;
  46165 }
  46166 #endif
  46167 
  46168 #ifdef __LITTLE_ENDIAN__
  46169 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_p64(poly64x2_t __p0) {
  46170   uint64x2_t __ret;
  46171   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51);
  46172   return __ret;
  46173 }
  46174 #else
  46175 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_p64(poly64x2_t __p0) {
  46176   uint64x2_t __ret;
  46177   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46178   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51);
  46179   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46180   return __ret;
  46181 }
  46182 #endif
  46183 
  46184 #ifdef __LITTLE_ENDIAN__
  46185 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_u8(uint8x16_t __p0) {
  46186   uint8x16_t __ret;
  46187   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48);
  46188   return __ret;
  46189 }
  46190 #else
  46191 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_u8(uint8x16_t __p0) {
  46192   uint8x16_t __ret;
  46193   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46194   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48);
  46195   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46196   return __ret;
  46197 }
  46198 #endif
  46199 
  46200 #ifdef __LITTLE_ENDIAN__
  46201 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_u32(uint32x4_t __p0) {
  46202   uint32x4_t __ret;
  46203   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50);
  46204   return __ret;
  46205 }
  46206 #else
  46207 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_u32(uint32x4_t __p0) {
  46208   uint32x4_t __ret;
  46209   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46210   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50);
  46211   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46212   return __ret;
  46213 }
  46214 #endif
  46215 
  46216 #ifdef __LITTLE_ENDIAN__
  46217 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_u64(uint64x2_t __p0) {
  46218   uint64x2_t __ret;
  46219   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51);
  46220   return __ret;
  46221 }
  46222 #else
  46223 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_u64(uint64x2_t __p0) {
  46224   uint64x2_t __ret;
  46225   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46226   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51);
  46227   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46228   return __ret;
  46229 }
  46230 #endif
  46231 
  46232 #ifdef __LITTLE_ENDIAN__
  46233 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_u16(uint16x8_t __p0) {
  46234   uint16x8_t __ret;
  46235   __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 49);
  46236   return __ret;
  46237 }
  46238 #else
  46239 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_u16(uint16x8_t __p0) {
  46240   uint16x8_t __ret;
  46241   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46242   __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 49);
  46243   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46244   return __ret;
  46245 }
  46246 #endif
  46247 
  46248 #ifdef __LITTLE_ENDIAN__
  46249 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_s8(int8x16_t __p0) {
  46250   uint8x16_t __ret;
  46251   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48);
  46252   return __ret;
  46253 }
  46254 #else
  46255 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_s8(int8x16_t __p0) {
  46256   uint8x16_t __ret;
  46257   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46258   __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48);
  46259   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46260   return __ret;
  46261 }
  46262 #endif
  46263 
  46264 #ifdef __LITTLE_ENDIAN__
  46265 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_f64(float64x2_t __p0) {
  46266   uint64x2_t __ret;
  46267   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51);
  46268   return __ret;
  46269 }
  46270 #else
  46271 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_f64(float64x2_t __p0) {
  46272   uint64x2_t __ret;
  46273   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46274   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51);
  46275   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46276   return __ret;
  46277 }
  46278 #endif
  46279 
  46280 #ifdef __LITTLE_ENDIAN__
  46281 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_f32(float32x4_t __p0) {
  46282   uint32x4_t __ret;
  46283   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50);
  46284   return __ret;
  46285 }
  46286 #else
  46287 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_f32(float32x4_t __p0) {
  46288   uint32x4_t __ret;
  46289   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46290   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50);
  46291   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46292   return __ret;
  46293 }
  46294 #endif
  46295 
  46296 #ifdef __LITTLE_ENDIAN__
  46297 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_s32(int32x4_t __p0) {
  46298   uint32x4_t __ret;
  46299   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50);
  46300   return __ret;
  46301 }
  46302 #else
  46303 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_s32(int32x4_t __p0) {
  46304   uint32x4_t __ret;
  46305   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46306   __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50);
  46307   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46308   return __ret;
  46309 }
  46310 #endif
  46311 
  46312 #ifdef __LITTLE_ENDIAN__
  46313 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_s64(int64x2_t __p0) {
  46314   uint64x2_t __ret;
  46315   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51);
  46316   return __ret;
  46317 }
  46318 #else
  46319 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_s64(int64x2_t __p0) {
  46320   uint64x2_t __ret;
  46321   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46322   __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51);
  46323   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46324   return __ret;
  46325 }
  46326 #endif
  46327 
  46328 #ifdef __LITTLE_ENDIAN__
  46329 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_s16(int16x8_t __p0) {
  46330   uint16x8_t __ret;
  46331   __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 49);
  46332   return __ret;
  46333 }
  46334 #else
  46335 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_s16(int16x8_t __p0) {
  46336   uint16x8_t __ret;
  46337   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46338   __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 49);
  46339   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46340   return __ret;
  46341 }
  46342 #endif
  46343 
  46344 #ifdef __LITTLE_ENDIAN__
  46345 __ai __attribute__((target("neon"))) uint8x8_t vceqz_u8(uint8x8_t __p0) {
  46346   uint8x8_t __ret;
  46347   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16);
  46348   return __ret;
  46349 }
  46350 #else
  46351 __ai __attribute__((target("neon"))) uint8x8_t vceqz_u8(uint8x8_t __p0) {
  46352   uint8x8_t __ret;
  46353   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46354   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16);
  46355   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46356   return __ret;
  46357 }
  46358 #endif
  46359 
  46360 #ifdef __LITTLE_ENDIAN__
  46361 __ai __attribute__((target("neon"))) uint32x2_t vceqz_u32(uint32x2_t __p0) {
  46362   uint32x2_t __ret;
  46363   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18);
  46364   return __ret;
  46365 }
  46366 #else
  46367 __ai __attribute__((target("neon"))) uint32x2_t vceqz_u32(uint32x2_t __p0) {
  46368   uint32x2_t __ret;
  46369   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46370   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18);
  46371   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46372   return __ret;
  46373 }
  46374 #endif
  46375 
  46376 __ai __attribute__((target("neon"))) uint64x1_t vceqz_u64(uint64x1_t __p0) {
  46377   uint64x1_t __ret;
  46378   __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19);
  46379   return __ret;
  46380 }
  46381 #ifdef __LITTLE_ENDIAN__
  46382 __ai __attribute__((target("neon"))) uint16x4_t vceqz_u16(uint16x4_t __p0) {
  46383   uint16x4_t __ret;
  46384   __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 17);
  46385   return __ret;
  46386 }
  46387 #else
  46388 __ai __attribute__((target("neon"))) uint16x4_t vceqz_u16(uint16x4_t __p0) {
  46389   uint16x4_t __ret;
  46390   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46391   __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 17);
  46392   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46393   return __ret;
  46394 }
  46395 #endif
  46396 
  46397 #ifdef __LITTLE_ENDIAN__
  46398 __ai __attribute__((target("neon"))) uint8x8_t vceqz_s8(int8x8_t __p0) {
  46399   uint8x8_t __ret;
  46400   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16);
  46401   return __ret;
  46402 }
  46403 #else
  46404 __ai __attribute__((target("neon"))) uint8x8_t vceqz_s8(int8x8_t __p0) {
  46405   uint8x8_t __ret;
  46406   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46407   __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16);
  46408   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46409   return __ret;
  46410 }
  46411 #endif
  46412 
  46413 __ai __attribute__((target("neon"))) uint64x1_t vceqz_f64(float64x1_t __p0) {
  46414   uint64x1_t __ret;
  46415   __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19);
  46416   return __ret;
  46417 }
  46418 #ifdef __LITTLE_ENDIAN__
  46419 __ai __attribute__((target("neon"))) uint32x2_t vceqz_f32(float32x2_t __p0) {
  46420   uint32x2_t __ret;
  46421   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18);
  46422   return __ret;
  46423 }
  46424 #else
  46425 __ai __attribute__((target("neon"))) uint32x2_t vceqz_f32(float32x2_t __p0) {
  46426   uint32x2_t __ret;
  46427   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46428   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18);
  46429   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46430   return __ret;
  46431 }
  46432 #endif
  46433 
  46434 #ifdef __LITTLE_ENDIAN__
  46435 __ai __attribute__((target("neon"))) uint32x2_t vceqz_s32(int32x2_t __p0) {
  46436   uint32x2_t __ret;
  46437   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18);
  46438   return __ret;
  46439 }
  46440 #else
  46441 __ai __attribute__((target("neon"))) uint32x2_t vceqz_s32(int32x2_t __p0) {
  46442   uint32x2_t __ret;
  46443   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46444   __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18);
  46445   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46446   return __ret;
  46447 }
  46448 #endif
  46449 
  46450 __ai __attribute__((target("neon"))) uint64x1_t vceqz_s64(int64x1_t __p0) {
  46451   uint64x1_t __ret;
  46452   __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19);
  46453   return __ret;
  46454 }
  46455 #ifdef __LITTLE_ENDIAN__
  46456 __ai __attribute__((target("neon"))) uint16x4_t vceqz_s16(int16x4_t __p0) {
  46457   uint16x4_t __ret;
  46458   __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 17);
  46459   return __ret;
  46460 }
  46461 #else
  46462 __ai __attribute__((target("neon"))) uint16x4_t vceqz_s16(int16x4_t __p0) {
  46463   uint16x4_t __ret;
  46464   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46465   __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 17);
  46466   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46467   return __ret;
  46468 }
  46469 #endif
  46470 
  46471 __ai __attribute__((target("neon"))) uint64_t vceqzd_u64(uint64_t __p0) {
  46472   uint64_t __ret;
  46473   __ret = (uint64_t) __builtin_neon_vceqzd_u64(__p0);
  46474   return __ret;
  46475 }
  46476 __ai __attribute__((target("neon"))) uint64_t vceqzd_s64(int64_t __p0) {
  46477   uint64_t __ret;
  46478   __ret = (uint64_t) __builtin_neon_vceqzd_s64(__p0);
  46479   return __ret;
  46480 }
  46481 __ai __attribute__((target("neon"))) uint64_t vceqzd_f64(float64_t __p0) {
  46482   uint64_t __ret;
  46483   __ret = (uint64_t) __builtin_neon_vceqzd_f64(__p0);
  46484   return __ret;
  46485 }
  46486 __ai __attribute__((target("neon"))) uint32_t vceqzs_f32(float32_t __p0) {
  46487   uint32_t __ret;
  46488   __ret = (uint32_t) __builtin_neon_vceqzs_f32(__p0);
  46489   return __ret;
  46490 }
  46491 #ifdef __LITTLE_ENDIAN__
  46492 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46493   uint64x2_t __ret;
  46494   __ret = (uint64x2_t)(__p0 >= __p1);
  46495   return __ret;
  46496 }
  46497 #else
  46498 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46499   uint64x2_t __ret;
  46500   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46501   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46502   __ret = (uint64x2_t)(__rev0 >= __rev1);
  46503   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46504   return __ret;
  46505 }
  46506 #endif
  46507 
  46508 #ifdef __LITTLE_ENDIAN__
  46509 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_f64(float64x2_t __p0, float64x2_t __p1) {
  46510   uint64x2_t __ret;
  46511   __ret = (uint64x2_t)(__p0 >= __p1);
  46512   return __ret;
  46513 }
  46514 #else
  46515 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_f64(float64x2_t __p0, float64x2_t __p1) {
  46516   uint64x2_t __ret;
  46517   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46518   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46519   __ret = (uint64x2_t)(__rev0 >= __rev1);
  46520   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46521   return __ret;
  46522 }
  46523 #endif
  46524 
  46525 #ifdef __LITTLE_ENDIAN__
  46526 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_s64(int64x2_t __p0, int64x2_t __p1) {
  46527   uint64x2_t __ret;
  46528   __ret = (uint64x2_t)(__p0 >= __p1);
  46529   return __ret;
  46530 }
  46531 #else
  46532 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_s64(int64x2_t __p0, int64x2_t __p1) {
  46533   uint64x2_t __ret;
  46534   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46535   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46536   __ret = (uint64x2_t)(__rev0 >= __rev1);
  46537   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46538   return __ret;
  46539 }
  46540 #endif
  46541 
  46542 __ai __attribute__((target("neon"))) uint64x1_t vcge_u64(uint64x1_t __p0, uint64x1_t __p1) {
  46543   uint64x1_t __ret;
  46544   __ret = (uint64x1_t)(__p0 >= __p1);
  46545   return __ret;
  46546 }
  46547 __ai __attribute__((target("neon"))) uint64x1_t vcge_f64(float64x1_t __p0, float64x1_t __p1) {
  46548   uint64x1_t __ret;
  46549   __ret = (uint64x1_t)(__p0 >= __p1);
  46550   return __ret;
  46551 }
  46552 __ai __attribute__((target("neon"))) uint64x1_t vcge_s64(int64x1_t __p0, int64x1_t __p1) {
  46553   uint64x1_t __ret;
  46554   __ret = (uint64x1_t)(__p0 >= __p1);
  46555   return __ret;
  46556 }
  46557 __ai __attribute__((target("neon"))) uint64_t vcged_s64(int64_t __p0, int64_t __p1) {
  46558   uint64_t __ret;
  46559   __ret = (uint64_t) __builtin_neon_vcged_s64(__p0, __p1);
  46560   return __ret;
  46561 }
  46562 __ai __attribute__((target("neon"))) uint64_t vcged_u64(uint64_t __p0, uint64_t __p1) {
  46563   uint64_t __ret;
  46564   __ret = (uint64_t) __builtin_neon_vcged_u64(__p0, __p1);
  46565   return __ret;
  46566 }
  46567 __ai __attribute__((target("neon"))) uint64_t vcged_f64(float64_t __p0, float64_t __p1) {
  46568   uint64_t __ret;
  46569   __ret = (uint64_t) __builtin_neon_vcged_f64(__p0, __p1);
  46570   return __ret;
  46571 }
  46572 __ai __attribute__((target("neon"))) uint32_t vcges_f32(float32_t __p0, float32_t __p1) {
  46573   uint32_t __ret;
  46574   __ret = (uint32_t) __builtin_neon_vcges_f32(__p0, __p1);
  46575   return __ret;
  46576 }
  46577 #ifdef __LITTLE_ENDIAN__
  46578 __ai __attribute__((target("neon"))) uint8x16_t vcgezq_s8(int8x16_t __p0) {
  46579   uint8x16_t __ret;
  46580   __ret = (uint8x16_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 48);
  46581   return __ret;
  46582 }
  46583 #else
  46584 __ai __attribute__((target("neon"))) uint8x16_t vcgezq_s8(int8x16_t __p0) {
  46585   uint8x16_t __ret;
  46586   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46587   __ret = (uint8x16_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 48);
  46588   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46589   return __ret;
  46590 }
  46591 #endif
  46592 
  46593 #ifdef __LITTLE_ENDIAN__
  46594 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_f64(float64x2_t __p0) {
  46595   uint64x2_t __ret;
  46596   __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 51);
  46597   return __ret;
  46598 }
  46599 #else
  46600 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_f64(float64x2_t __p0) {
  46601   uint64x2_t __ret;
  46602   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46603   __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 51);
  46604   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46605   return __ret;
  46606 }
  46607 #endif
  46608 
  46609 #ifdef __LITTLE_ENDIAN__
  46610 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_f32(float32x4_t __p0) {
  46611   uint32x4_t __ret;
  46612   __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 50);
  46613   return __ret;
  46614 }
  46615 #else
  46616 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_f32(float32x4_t __p0) {
  46617   uint32x4_t __ret;
  46618   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46619   __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 50);
  46620   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46621   return __ret;
  46622 }
  46623 #endif
  46624 
  46625 #ifdef __LITTLE_ENDIAN__
  46626 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_s32(int32x4_t __p0) {
  46627   uint32x4_t __ret;
  46628   __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 50);
  46629   return __ret;
  46630 }
  46631 #else
  46632 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_s32(int32x4_t __p0) {
  46633   uint32x4_t __ret;
  46634   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46635   __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 50);
  46636   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46637   return __ret;
  46638 }
  46639 #endif
  46640 
  46641 #ifdef __LITTLE_ENDIAN__
  46642 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_s64(int64x2_t __p0) {
  46643   uint64x2_t __ret;
  46644   __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 51);
  46645   return __ret;
  46646 }
  46647 #else
  46648 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_s64(int64x2_t __p0) {
  46649   uint64x2_t __ret;
  46650   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46651   __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 51);
  46652   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46653   return __ret;
  46654 }
  46655 #endif
  46656 
  46657 #ifdef __LITTLE_ENDIAN__
  46658 __ai __attribute__((target("neon"))) uint16x8_t vcgezq_s16(int16x8_t __p0) {
  46659   uint16x8_t __ret;
  46660   __ret = (uint16x8_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 49);
  46661   return __ret;
  46662 }
  46663 #else
  46664 __ai __attribute__((target("neon"))) uint16x8_t vcgezq_s16(int16x8_t __p0) {
  46665   uint16x8_t __ret;
  46666   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46667   __ret = (uint16x8_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 49);
  46668   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46669   return __ret;
  46670 }
  46671 #endif
  46672 
  46673 #ifdef __LITTLE_ENDIAN__
  46674 __ai __attribute__((target("neon"))) uint8x8_t vcgez_s8(int8x8_t __p0) {
  46675   uint8x8_t __ret;
  46676   __ret = (uint8x8_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 16);
  46677   return __ret;
  46678 }
  46679 #else
  46680 __ai __attribute__((target("neon"))) uint8x8_t vcgez_s8(int8x8_t __p0) {
  46681   uint8x8_t __ret;
  46682   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46683   __ret = (uint8x8_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 16);
  46684   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46685   return __ret;
  46686 }
  46687 #endif
  46688 
  46689 __ai __attribute__((target("neon"))) uint64x1_t vcgez_f64(float64x1_t __p0) {
  46690   uint64x1_t __ret;
  46691   __ret = (uint64x1_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 19);
  46692   return __ret;
  46693 }
  46694 #ifdef __LITTLE_ENDIAN__
  46695 __ai __attribute__((target("neon"))) uint32x2_t vcgez_f32(float32x2_t __p0) {
  46696   uint32x2_t __ret;
  46697   __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 18);
  46698   return __ret;
  46699 }
  46700 #else
  46701 __ai __attribute__((target("neon"))) uint32x2_t vcgez_f32(float32x2_t __p0) {
  46702   uint32x2_t __ret;
  46703   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46704   __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 18);
  46705   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46706   return __ret;
  46707 }
  46708 #endif
  46709 
  46710 #ifdef __LITTLE_ENDIAN__
  46711 __ai __attribute__((target("neon"))) uint32x2_t vcgez_s32(int32x2_t __p0) {
  46712   uint32x2_t __ret;
  46713   __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 18);
  46714   return __ret;
  46715 }
  46716 #else
  46717 __ai __attribute__((target("neon"))) uint32x2_t vcgez_s32(int32x2_t __p0) {
  46718   uint32x2_t __ret;
  46719   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46720   __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 18);
  46721   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46722   return __ret;
  46723 }
  46724 #endif
  46725 
  46726 __ai __attribute__((target("neon"))) uint64x1_t vcgez_s64(int64x1_t __p0) {
  46727   uint64x1_t __ret;
  46728   __ret = (uint64x1_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 19);
  46729   return __ret;
  46730 }
  46731 #ifdef __LITTLE_ENDIAN__
  46732 __ai __attribute__((target("neon"))) uint16x4_t vcgez_s16(int16x4_t __p0) {
  46733   uint16x4_t __ret;
  46734   __ret = (uint16x4_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 17);
  46735   return __ret;
  46736 }
  46737 #else
  46738 __ai __attribute__((target("neon"))) uint16x4_t vcgez_s16(int16x4_t __p0) {
  46739   uint16x4_t __ret;
  46740   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46741   __ret = (uint16x4_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 17);
  46742   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46743   return __ret;
  46744 }
  46745 #endif
  46746 
  46747 __ai __attribute__((target("neon"))) uint64_t vcgezd_s64(int64_t __p0) {
  46748   uint64_t __ret;
  46749   __ret = (uint64_t) __builtin_neon_vcgezd_s64(__p0);
  46750   return __ret;
  46751 }
  46752 __ai __attribute__((target("neon"))) uint64_t vcgezd_f64(float64_t __p0) {
  46753   uint64_t __ret;
  46754   __ret = (uint64_t) __builtin_neon_vcgezd_f64(__p0);
  46755   return __ret;
  46756 }
  46757 __ai __attribute__((target("neon"))) uint32_t vcgezs_f32(float32_t __p0) {
  46758   uint32_t __ret;
  46759   __ret = (uint32_t) __builtin_neon_vcgezs_f32(__p0);
  46760   return __ret;
  46761 }
  46762 #ifdef __LITTLE_ENDIAN__
  46763 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46764   uint64x2_t __ret;
  46765   __ret = (uint64x2_t)(__p0 > __p1);
  46766   return __ret;
  46767 }
  46768 #else
  46769 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  46770   uint64x2_t __ret;
  46771   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46772   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46773   __ret = (uint64x2_t)(__rev0 > __rev1);
  46774   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46775   return __ret;
  46776 }
  46777 #endif
  46778 
  46779 #ifdef __LITTLE_ENDIAN__
  46780 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_f64(float64x2_t __p0, float64x2_t __p1) {
  46781   uint64x2_t __ret;
  46782   __ret = (uint64x2_t)(__p0 > __p1);
  46783   return __ret;
  46784 }
  46785 #else
  46786 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_f64(float64x2_t __p0, float64x2_t __p1) {
  46787   uint64x2_t __ret;
  46788   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46789   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46790   __ret = (uint64x2_t)(__rev0 > __rev1);
  46791   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46792   return __ret;
  46793 }
  46794 #endif
  46795 
  46796 #ifdef __LITTLE_ENDIAN__
  46797 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_s64(int64x2_t __p0, int64x2_t __p1) {
  46798   uint64x2_t __ret;
  46799   __ret = (uint64x2_t)(__p0 > __p1);
  46800   return __ret;
  46801 }
  46802 #else
  46803 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_s64(int64x2_t __p0, int64x2_t __p1) {
  46804   uint64x2_t __ret;
  46805   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46806   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  46807   __ret = (uint64x2_t)(__rev0 > __rev1);
  46808   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46809   return __ret;
  46810 }
  46811 #endif
  46812 
  46813 __ai __attribute__((target("neon"))) uint64x1_t vcgt_u64(uint64x1_t __p0, uint64x1_t __p1) {
  46814   uint64x1_t __ret;
  46815   __ret = (uint64x1_t)(__p0 > __p1);
  46816   return __ret;
  46817 }
  46818 __ai __attribute__((target("neon"))) uint64x1_t vcgt_f64(float64x1_t __p0, float64x1_t __p1) {
  46819   uint64x1_t __ret;
  46820   __ret = (uint64x1_t)(__p0 > __p1);
  46821   return __ret;
  46822 }
  46823 __ai __attribute__((target("neon"))) uint64x1_t vcgt_s64(int64x1_t __p0, int64x1_t __p1) {
  46824   uint64x1_t __ret;
  46825   __ret = (uint64x1_t)(__p0 > __p1);
  46826   return __ret;
  46827 }
  46828 __ai __attribute__((target("neon"))) uint64_t vcgtd_s64(int64_t __p0, int64_t __p1) {
  46829   uint64_t __ret;
  46830   __ret = (uint64_t) __builtin_neon_vcgtd_s64(__p0, __p1);
  46831   return __ret;
  46832 }
  46833 __ai __attribute__((target("neon"))) uint64_t vcgtd_u64(uint64_t __p0, uint64_t __p1) {
  46834   uint64_t __ret;
  46835   __ret = (uint64_t) __builtin_neon_vcgtd_u64(__p0, __p1);
  46836   return __ret;
  46837 }
  46838 __ai __attribute__((target("neon"))) uint64_t vcgtd_f64(float64_t __p0, float64_t __p1) {
  46839   uint64_t __ret;
  46840   __ret = (uint64_t) __builtin_neon_vcgtd_f64(__p0, __p1);
  46841   return __ret;
  46842 }
  46843 __ai __attribute__((target("neon"))) uint32_t vcgts_f32(float32_t __p0, float32_t __p1) {
  46844   uint32_t __ret;
  46845   __ret = (uint32_t) __builtin_neon_vcgts_f32(__p0, __p1);
  46846   return __ret;
  46847 }
  46848 #ifdef __LITTLE_ENDIAN__
  46849 __ai __attribute__((target("neon"))) uint8x16_t vcgtzq_s8(int8x16_t __p0) {
  46850   uint8x16_t __ret;
  46851   __ret = (uint8x16_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 48);
  46852   return __ret;
  46853 }
  46854 #else
  46855 __ai __attribute__((target("neon"))) uint8x16_t vcgtzq_s8(int8x16_t __p0) {
  46856   uint8x16_t __ret;
  46857   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46858   __ret = (uint8x16_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 48);
  46859   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  46860   return __ret;
  46861 }
  46862 #endif
  46863 
  46864 #ifdef __LITTLE_ENDIAN__
  46865 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_f64(float64x2_t __p0) {
  46866   uint64x2_t __ret;
  46867   __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 51);
  46868   return __ret;
  46869 }
  46870 #else
  46871 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_f64(float64x2_t __p0) {
  46872   uint64x2_t __ret;
  46873   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46874   __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 51);
  46875   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46876   return __ret;
  46877 }
  46878 #endif
  46879 
  46880 #ifdef __LITTLE_ENDIAN__
  46881 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_f32(float32x4_t __p0) {
  46882   uint32x4_t __ret;
  46883   __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 50);
  46884   return __ret;
  46885 }
  46886 #else
  46887 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_f32(float32x4_t __p0) {
  46888   uint32x4_t __ret;
  46889   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46890   __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 50);
  46891   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46892   return __ret;
  46893 }
  46894 #endif
  46895 
  46896 #ifdef __LITTLE_ENDIAN__
  46897 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_s32(int32x4_t __p0) {
  46898   uint32x4_t __ret;
  46899   __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 50);
  46900   return __ret;
  46901 }
  46902 #else
  46903 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_s32(int32x4_t __p0) {
  46904   uint32x4_t __ret;
  46905   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  46906   __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 50);
  46907   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  46908   return __ret;
  46909 }
  46910 #endif
  46911 
  46912 #ifdef __LITTLE_ENDIAN__
  46913 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_s64(int64x2_t __p0) {
  46914   uint64x2_t __ret;
  46915   __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 51);
  46916   return __ret;
  46917 }
  46918 #else
  46919 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_s64(int64x2_t __p0) {
  46920   uint64x2_t __ret;
  46921   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46922   __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 51);
  46923   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46924   return __ret;
  46925 }
  46926 #endif
  46927 
  46928 #ifdef __LITTLE_ENDIAN__
  46929 __ai __attribute__((target("neon"))) uint16x8_t vcgtzq_s16(int16x8_t __p0) {
  46930   uint16x8_t __ret;
  46931   __ret = (uint16x8_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 49);
  46932   return __ret;
  46933 }
  46934 #else
  46935 __ai __attribute__((target("neon"))) uint16x8_t vcgtzq_s16(int16x8_t __p0) {
  46936   uint16x8_t __ret;
  46937   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46938   __ret = (uint16x8_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 49);
  46939   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46940   return __ret;
  46941 }
  46942 #endif
  46943 
  46944 #ifdef __LITTLE_ENDIAN__
  46945 __ai __attribute__((target("neon"))) uint8x8_t vcgtz_s8(int8x8_t __p0) {
  46946   uint8x8_t __ret;
  46947   __ret = (uint8x8_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 16);
  46948   return __ret;
  46949 }
  46950 #else
  46951 __ai __attribute__((target("neon"))) uint8x8_t vcgtz_s8(int8x8_t __p0) {
  46952   uint8x8_t __ret;
  46953   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  46954   __ret = (uint8x8_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 16);
  46955   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  46956   return __ret;
  46957 }
  46958 #endif
  46959 
  46960 __ai __attribute__((target("neon"))) uint64x1_t vcgtz_f64(float64x1_t __p0) {
  46961   uint64x1_t __ret;
  46962   __ret = (uint64x1_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 19);
  46963   return __ret;
  46964 }
  46965 #ifdef __LITTLE_ENDIAN__
  46966 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_f32(float32x2_t __p0) {
  46967   uint32x2_t __ret;
  46968   __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 18);
  46969   return __ret;
  46970 }
  46971 #else
  46972 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_f32(float32x2_t __p0) {
  46973   uint32x2_t __ret;
  46974   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46975   __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 18);
  46976   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46977   return __ret;
  46978 }
  46979 #endif
  46980 
  46981 #ifdef __LITTLE_ENDIAN__
  46982 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_s32(int32x2_t __p0) {
  46983   uint32x2_t __ret;
  46984   __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 18);
  46985   return __ret;
  46986 }
  46987 #else
  46988 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_s32(int32x2_t __p0) {
  46989   uint32x2_t __ret;
  46990   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  46991   __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 18);
  46992   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  46993   return __ret;
  46994 }
  46995 #endif
  46996 
  46997 __ai __attribute__((target("neon"))) uint64x1_t vcgtz_s64(int64x1_t __p0) {
  46998   uint64x1_t __ret;
  46999   __ret = (uint64x1_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 19);
  47000   return __ret;
  47001 }
  47002 #ifdef __LITTLE_ENDIAN__
  47003 __ai __attribute__((target("neon"))) uint16x4_t vcgtz_s16(int16x4_t __p0) {
  47004   uint16x4_t __ret;
  47005   __ret = (uint16x4_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 17);
  47006   return __ret;
  47007 }
  47008 #else
  47009 __ai __attribute__((target("neon"))) uint16x4_t vcgtz_s16(int16x4_t __p0) {
  47010   uint16x4_t __ret;
  47011   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47012   __ret = (uint16x4_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 17);
  47013   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47014   return __ret;
  47015 }
  47016 #endif
  47017 
  47018 __ai __attribute__((target("neon"))) uint64_t vcgtzd_s64(int64_t __p0) {
  47019   uint64_t __ret;
  47020   __ret = (uint64_t) __builtin_neon_vcgtzd_s64(__p0);
  47021   return __ret;
  47022 }
  47023 __ai __attribute__((target("neon"))) uint64_t vcgtzd_f64(float64_t __p0) {
  47024   uint64_t __ret;
  47025   __ret = (uint64_t) __builtin_neon_vcgtzd_f64(__p0);
  47026   return __ret;
  47027 }
  47028 __ai __attribute__((target("neon"))) uint32_t vcgtzs_f32(float32_t __p0) {
  47029   uint32_t __ret;
  47030   __ret = (uint32_t) __builtin_neon_vcgtzs_f32(__p0);
  47031   return __ret;
  47032 }
  47033 #ifdef __LITTLE_ENDIAN__
  47034 __ai __attribute__((target("neon"))) uint64x2_t vcleq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  47035   uint64x2_t __ret;
  47036   __ret = (uint64x2_t)(__p0 <= __p1);
  47037   return __ret;
  47038 }
  47039 #else
  47040 __ai __attribute__((target("neon"))) uint64x2_t vcleq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  47041   uint64x2_t __ret;
  47042   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47043   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47044   __ret = (uint64x2_t)(__rev0 <= __rev1);
  47045   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47046   return __ret;
  47047 }
  47048 #endif
  47049 
  47050 #ifdef __LITTLE_ENDIAN__
  47051 __ai __attribute__((target("neon"))) uint64x2_t vcleq_f64(float64x2_t __p0, float64x2_t __p1) {
  47052   uint64x2_t __ret;
  47053   __ret = (uint64x2_t)(__p0 <= __p1);
  47054   return __ret;
  47055 }
  47056 #else
  47057 __ai __attribute__((target("neon"))) uint64x2_t vcleq_f64(float64x2_t __p0, float64x2_t __p1) {
  47058   uint64x2_t __ret;
  47059   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47060   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47061   __ret = (uint64x2_t)(__rev0 <= __rev1);
  47062   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47063   return __ret;
  47064 }
  47065 #endif
  47066 
  47067 #ifdef __LITTLE_ENDIAN__
  47068 __ai __attribute__((target("neon"))) uint64x2_t vcleq_s64(int64x2_t __p0, int64x2_t __p1) {
  47069   uint64x2_t __ret;
  47070   __ret = (uint64x2_t)(__p0 <= __p1);
  47071   return __ret;
  47072 }
  47073 #else
  47074 __ai __attribute__((target("neon"))) uint64x2_t vcleq_s64(int64x2_t __p0, int64x2_t __p1) {
  47075   uint64x2_t __ret;
  47076   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47077   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47078   __ret = (uint64x2_t)(__rev0 <= __rev1);
  47079   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47080   return __ret;
  47081 }
  47082 #endif
  47083 
  47084 __ai __attribute__((target("neon"))) uint64x1_t vcle_u64(uint64x1_t __p0, uint64x1_t __p1) {
  47085   uint64x1_t __ret;
  47086   __ret = (uint64x1_t)(__p0 <= __p1);
  47087   return __ret;
  47088 }
  47089 __ai __attribute__((target("neon"))) uint64x1_t vcle_f64(float64x1_t __p0, float64x1_t __p1) {
  47090   uint64x1_t __ret;
  47091   __ret = (uint64x1_t)(__p0 <= __p1);
  47092   return __ret;
  47093 }
  47094 __ai __attribute__((target("neon"))) uint64x1_t vcle_s64(int64x1_t __p0, int64x1_t __p1) {
  47095   uint64x1_t __ret;
  47096   __ret = (uint64x1_t)(__p0 <= __p1);
  47097   return __ret;
  47098 }
  47099 __ai __attribute__((target("neon"))) uint64_t vcled_u64(uint64_t __p0, uint64_t __p1) {
  47100   uint64_t __ret;
  47101   __ret = (uint64_t) __builtin_neon_vcled_u64(__p0, __p1);
  47102   return __ret;
  47103 }
  47104 __ai __attribute__((target("neon"))) uint64_t vcled_s64(int64_t __p0, int64_t __p1) {
  47105   uint64_t __ret;
  47106   __ret = (uint64_t) __builtin_neon_vcled_s64(__p0, __p1);
  47107   return __ret;
  47108 }
  47109 __ai __attribute__((target("neon"))) uint64_t vcled_f64(float64_t __p0, float64_t __p1) {
  47110   uint64_t __ret;
  47111   __ret = (uint64_t) __builtin_neon_vcled_f64(__p0, __p1);
  47112   return __ret;
  47113 }
  47114 __ai __attribute__((target("neon"))) uint32_t vcles_f32(float32_t __p0, float32_t __p1) {
  47115   uint32_t __ret;
  47116   __ret = (uint32_t) __builtin_neon_vcles_f32(__p0, __p1);
  47117   return __ret;
  47118 }
  47119 #ifdef __LITTLE_ENDIAN__
  47120 __ai __attribute__((target("neon"))) uint8x16_t vclezq_s8(int8x16_t __p0) {
  47121   uint8x16_t __ret;
  47122   __ret = (uint8x16_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 48);
  47123   return __ret;
  47124 }
  47125 #else
  47126 __ai __attribute__((target("neon"))) uint8x16_t vclezq_s8(int8x16_t __p0) {
  47127   uint8x16_t __ret;
  47128   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  47129   __ret = (uint8x16_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 48);
  47130   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  47131   return __ret;
  47132 }
  47133 #endif
  47134 
  47135 #ifdef __LITTLE_ENDIAN__
  47136 __ai __attribute__((target("neon"))) uint64x2_t vclezq_f64(float64x2_t __p0) {
  47137   uint64x2_t __ret;
  47138   __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 51);
  47139   return __ret;
  47140 }
  47141 #else
  47142 __ai __attribute__((target("neon"))) uint64x2_t vclezq_f64(float64x2_t __p0) {
  47143   uint64x2_t __ret;
  47144   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47145   __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 51);
  47146   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47147   return __ret;
  47148 }
  47149 #endif
  47150 
  47151 #ifdef __LITTLE_ENDIAN__
  47152 __ai __attribute__((target("neon"))) uint32x4_t vclezq_f32(float32x4_t __p0) {
  47153   uint32x4_t __ret;
  47154   __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 50);
  47155   return __ret;
  47156 }
  47157 #else
  47158 __ai __attribute__((target("neon"))) uint32x4_t vclezq_f32(float32x4_t __p0) {
  47159   uint32x4_t __ret;
  47160   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47161   __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 50);
  47162   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47163   return __ret;
  47164 }
  47165 #endif
  47166 
  47167 #ifdef __LITTLE_ENDIAN__
  47168 __ai __attribute__((target("neon"))) uint32x4_t vclezq_s32(int32x4_t __p0) {
  47169   uint32x4_t __ret;
  47170   __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 50);
  47171   return __ret;
  47172 }
  47173 #else
  47174 __ai __attribute__((target("neon"))) uint32x4_t vclezq_s32(int32x4_t __p0) {
  47175   uint32x4_t __ret;
  47176   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47177   __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 50);
  47178   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47179   return __ret;
  47180 }
  47181 #endif
  47182 
  47183 #ifdef __LITTLE_ENDIAN__
  47184 __ai __attribute__((target("neon"))) uint64x2_t vclezq_s64(int64x2_t __p0) {
  47185   uint64x2_t __ret;
  47186   __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 51);
  47187   return __ret;
  47188 }
  47189 #else
  47190 __ai __attribute__((target("neon"))) uint64x2_t vclezq_s64(int64x2_t __p0) {
  47191   uint64x2_t __ret;
  47192   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47193   __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 51);
  47194   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47195   return __ret;
  47196 }
  47197 #endif
  47198 
  47199 #ifdef __LITTLE_ENDIAN__
  47200 __ai __attribute__((target("neon"))) uint16x8_t vclezq_s16(int16x8_t __p0) {
  47201   uint16x8_t __ret;
  47202   __ret = (uint16x8_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 49);
  47203   return __ret;
  47204 }
  47205 #else
  47206 __ai __attribute__((target("neon"))) uint16x8_t vclezq_s16(int16x8_t __p0) {
  47207   uint16x8_t __ret;
  47208   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  47209   __ret = (uint16x8_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 49);
  47210   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  47211   return __ret;
  47212 }
  47213 #endif
  47214 
  47215 #ifdef __LITTLE_ENDIAN__
  47216 __ai __attribute__((target("neon"))) uint8x8_t vclez_s8(int8x8_t __p0) {
  47217   uint8x8_t __ret;
  47218   __ret = (uint8x8_t) __builtin_neon_vclez_v((int8x8_t)__p0, 16);
  47219   return __ret;
  47220 }
  47221 #else
  47222 __ai __attribute__((target("neon"))) uint8x8_t vclez_s8(int8x8_t __p0) {
  47223   uint8x8_t __ret;
  47224   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  47225   __ret = (uint8x8_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 16);
  47226   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  47227   return __ret;
  47228 }
  47229 #endif
  47230 
  47231 __ai __attribute__((target("neon"))) uint64x1_t vclez_f64(float64x1_t __p0) {
  47232   uint64x1_t __ret;
  47233   __ret = (uint64x1_t) __builtin_neon_vclez_v((int8x8_t)__p0, 19);
  47234   return __ret;
  47235 }
  47236 #ifdef __LITTLE_ENDIAN__
  47237 __ai __attribute__((target("neon"))) uint32x2_t vclez_f32(float32x2_t __p0) {
  47238   uint32x2_t __ret;
  47239   __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__p0, 18);
  47240   return __ret;
  47241 }
  47242 #else
  47243 __ai __attribute__((target("neon"))) uint32x2_t vclez_f32(float32x2_t __p0) {
  47244   uint32x2_t __ret;
  47245   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47246   __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 18);
  47247   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47248   return __ret;
  47249 }
  47250 #endif
  47251 
  47252 #ifdef __LITTLE_ENDIAN__
  47253 __ai __attribute__((target("neon"))) uint32x2_t vclez_s32(int32x2_t __p0) {
  47254   uint32x2_t __ret;
  47255   __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__p0, 18);
  47256   return __ret;
  47257 }
  47258 #else
  47259 __ai __attribute__((target("neon"))) uint32x2_t vclez_s32(int32x2_t __p0) {
  47260   uint32x2_t __ret;
  47261   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47262   __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 18);
  47263   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47264   return __ret;
  47265 }
  47266 #endif
  47267 
  47268 __ai __attribute__((target("neon"))) uint64x1_t vclez_s64(int64x1_t __p0) {
  47269   uint64x1_t __ret;
  47270   __ret = (uint64x1_t) __builtin_neon_vclez_v((int8x8_t)__p0, 19);
  47271   return __ret;
  47272 }
  47273 #ifdef __LITTLE_ENDIAN__
  47274 __ai __attribute__((target("neon"))) uint16x4_t vclez_s16(int16x4_t __p0) {
  47275   uint16x4_t __ret;
  47276   __ret = (uint16x4_t) __builtin_neon_vclez_v((int8x8_t)__p0, 17);
  47277   return __ret;
  47278 }
  47279 #else
  47280 __ai __attribute__((target("neon"))) uint16x4_t vclez_s16(int16x4_t __p0) {
  47281   uint16x4_t __ret;
  47282   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47283   __ret = (uint16x4_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 17);
  47284   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47285   return __ret;
  47286 }
  47287 #endif
  47288 
  47289 __ai __attribute__((target("neon"))) uint64_t vclezd_s64(int64_t __p0) {
  47290   uint64_t __ret;
  47291   __ret = (uint64_t) __builtin_neon_vclezd_s64(__p0);
  47292   return __ret;
  47293 }
  47294 __ai __attribute__((target("neon"))) uint64_t vclezd_f64(float64_t __p0) {
  47295   uint64_t __ret;
  47296   __ret = (uint64_t) __builtin_neon_vclezd_f64(__p0);
  47297   return __ret;
  47298 }
  47299 __ai __attribute__((target("neon"))) uint32_t vclezs_f32(float32_t __p0) {
  47300   uint32_t __ret;
  47301   __ret = (uint32_t) __builtin_neon_vclezs_f32(__p0);
  47302   return __ret;
  47303 }
  47304 #ifdef __LITTLE_ENDIAN__
  47305 __ai __attribute__((target("neon"))) uint64x2_t vcltq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  47306   uint64x2_t __ret;
  47307   __ret = (uint64x2_t)(__p0 < __p1);
  47308   return __ret;
  47309 }
  47310 #else
  47311 __ai __attribute__((target("neon"))) uint64x2_t vcltq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  47312   uint64x2_t __ret;
  47313   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47314   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47315   __ret = (uint64x2_t)(__rev0 < __rev1);
  47316   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47317   return __ret;
  47318 }
  47319 #endif
  47320 
  47321 #ifdef __LITTLE_ENDIAN__
  47322 __ai __attribute__((target("neon"))) uint64x2_t vcltq_f64(float64x2_t __p0, float64x2_t __p1) {
  47323   uint64x2_t __ret;
  47324   __ret = (uint64x2_t)(__p0 < __p1);
  47325   return __ret;
  47326 }
  47327 #else
  47328 __ai __attribute__((target("neon"))) uint64x2_t vcltq_f64(float64x2_t __p0, float64x2_t __p1) {
  47329   uint64x2_t __ret;
  47330   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47331   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47332   __ret = (uint64x2_t)(__rev0 < __rev1);
  47333   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47334   return __ret;
  47335 }
  47336 #endif
  47337 
  47338 #ifdef __LITTLE_ENDIAN__
  47339 __ai __attribute__((target("neon"))) uint64x2_t vcltq_s64(int64x2_t __p0, int64x2_t __p1) {
  47340   uint64x2_t __ret;
  47341   __ret = (uint64x2_t)(__p0 < __p1);
  47342   return __ret;
  47343 }
  47344 #else
  47345 __ai __attribute__((target("neon"))) uint64x2_t vcltq_s64(int64x2_t __p0, int64x2_t __p1) {
  47346   uint64x2_t __ret;
  47347   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47348   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  47349   __ret = (uint64x2_t)(__rev0 < __rev1);
  47350   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47351   return __ret;
  47352 }
  47353 #endif
  47354 
  47355 __ai __attribute__((target("neon"))) uint64x1_t vclt_u64(uint64x1_t __p0, uint64x1_t __p1) {
  47356   uint64x1_t __ret;
  47357   __ret = (uint64x1_t)(__p0 < __p1);
  47358   return __ret;
  47359 }
  47360 __ai __attribute__((target("neon"))) uint64x1_t vclt_f64(float64x1_t __p0, float64x1_t __p1) {
  47361   uint64x1_t __ret;
  47362   __ret = (uint64x1_t)(__p0 < __p1);
  47363   return __ret;
  47364 }
  47365 __ai __attribute__((target("neon"))) uint64x1_t vclt_s64(int64x1_t __p0, int64x1_t __p1) {
  47366   uint64x1_t __ret;
  47367   __ret = (uint64x1_t)(__p0 < __p1);
  47368   return __ret;
  47369 }
  47370 __ai __attribute__((target("neon"))) uint64_t vcltd_u64(uint64_t __p0, uint64_t __p1) {
  47371   uint64_t __ret;
  47372   __ret = (uint64_t) __builtin_neon_vcltd_u64(__p0, __p1);
  47373   return __ret;
  47374 }
  47375 __ai __attribute__((target("neon"))) uint64_t vcltd_s64(int64_t __p0, int64_t __p1) {
  47376   uint64_t __ret;
  47377   __ret = (uint64_t) __builtin_neon_vcltd_s64(__p0, __p1);
  47378   return __ret;
  47379 }
  47380 __ai __attribute__((target("neon"))) uint64_t vcltd_f64(float64_t __p0, float64_t __p1) {
  47381   uint64_t __ret;
  47382   __ret = (uint64_t) __builtin_neon_vcltd_f64(__p0, __p1);
  47383   return __ret;
  47384 }
  47385 __ai __attribute__((target("neon"))) uint32_t vclts_f32(float32_t __p0, float32_t __p1) {
  47386   uint32_t __ret;
  47387   __ret = (uint32_t) __builtin_neon_vclts_f32(__p0, __p1);
  47388   return __ret;
  47389 }
  47390 #ifdef __LITTLE_ENDIAN__
  47391 __ai __attribute__((target("neon"))) uint8x16_t vcltzq_s8(int8x16_t __p0) {
  47392   uint8x16_t __ret;
  47393   __ret = (uint8x16_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 48);
  47394   return __ret;
  47395 }
  47396 #else
  47397 __ai __attribute__((target("neon"))) uint8x16_t vcltzq_s8(int8x16_t __p0) {
  47398   uint8x16_t __ret;
  47399   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  47400   __ret = (uint8x16_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 48);
  47401   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  47402   return __ret;
  47403 }
  47404 #endif
  47405 
  47406 #ifdef __LITTLE_ENDIAN__
  47407 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_f64(float64x2_t __p0) {
  47408   uint64x2_t __ret;
  47409   __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 51);
  47410   return __ret;
  47411 }
  47412 #else
  47413 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_f64(float64x2_t __p0) {
  47414   uint64x2_t __ret;
  47415   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47416   __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 51);
  47417   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47418   return __ret;
  47419 }
  47420 #endif
  47421 
  47422 #ifdef __LITTLE_ENDIAN__
  47423 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_f32(float32x4_t __p0) {
  47424   uint32x4_t __ret;
  47425   __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 50);
  47426   return __ret;
  47427 }
  47428 #else
  47429 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_f32(float32x4_t __p0) {
  47430   uint32x4_t __ret;
  47431   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47432   __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 50);
  47433   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47434   return __ret;
  47435 }
  47436 #endif
  47437 
  47438 #ifdef __LITTLE_ENDIAN__
  47439 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_s32(int32x4_t __p0) {
  47440   uint32x4_t __ret;
  47441   __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 50);
  47442   return __ret;
  47443 }
  47444 #else
  47445 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_s32(int32x4_t __p0) {
  47446   uint32x4_t __ret;
  47447   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47448   __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 50);
  47449   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47450   return __ret;
  47451 }
  47452 #endif
  47453 
  47454 #ifdef __LITTLE_ENDIAN__
  47455 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_s64(int64x2_t __p0) {
  47456   uint64x2_t __ret;
  47457   __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 51);
  47458   return __ret;
  47459 }
  47460 #else
  47461 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_s64(int64x2_t __p0) {
  47462   uint64x2_t __ret;
  47463   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47464   __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 51);
  47465   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47466   return __ret;
  47467 }
  47468 #endif
  47469 
  47470 #ifdef __LITTLE_ENDIAN__
  47471 __ai __attribute__((target("neon"))) uint16x8_t vcltzq_s16(int16x8_t __p0) {
  47472   uint16x8_t __ret;
  47473   __ret = (uint16x8_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 49);
  47474   return __ret;
  47475 }
  47476 #else
  47477 __ai __attribute__((target("neon"))) uint16x8_t vcltzq_s16(int16x8_t __p0) {
  47478   uint16x8_t __ret;
  47479   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  47480   __ret = (uint16x8_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 49);
  47481   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  47482   return __ret;
  47483 }
  47484 #endif
  47485 
  47486 #ifdef __LITTLE_ENDIAN__
  47487 __ai __attribute__((target("neon"))) uint8x8_t vcltz_s8(int8x8_t __p0) {
  47488   uint8x8_t __ret;
  47489   __ret = (uint8x8_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 16);
  47490   return __ret;
  47491 }
  47492 #else
  47493 __ai __attribute__((target("neon"))) uint8x8_t vcltz_s8(int8x8_t __p0) {
  47494   uint8x8_t __ret;
  47495   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  47496   __ret = (uint8x8_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 16);
  47497   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  47498   return __ret;
  47499 }
  47500 #endif
  47501 
  47502 __ai __attribute__((target("neon"))) uint64x1_t vcltz_f64(float64x1_t __p0) {
  47503   uint64x1_t __ret;
  47504   __ret = (uint64x1_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 19);
  47505   return __ret;
  47506 }
  47507 #ifdef __LITTLE_ENDIAN__
  47508 __ai __attribute__((target("neon"))) uint32x2_t vcltz_f32(float32x2_t __p0) {
  47509   uint32x2_t __ret;
  47510   __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 18);
  47511   return __ret;
  47512 }
  47513 #else
  47514 __ai __attribute__((target("neon"))) uint32x2_t vcltz_f32(float32x2_t __p0) {
  47515   uint32x2_t __ret;
  47516   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47517   __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 18);
  47518   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47519   return __ret;
  47520 }
  47521 #endif
  47522 
  47523 #ifdef __LITTLE_ENDIAN__
  47524 __ai __attribute__((target("neon"))) uint32x2_t vcltz_s32(int32x2_t __p0) {
  47525   uint32x2_t __ret;
  47526   __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 18);
  47527   return __ret;
  47528 }
  47529 #else
  47530 __ai __attribute__((target("neon"))) uint32x2_t vcltz_s32(int32x2_t __p0) {
  47531   uint32x2_t __ret;
  47532   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  47533   __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 18);
  47534   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47535   return __ret;
  47536 }
  47537 #endif
  47538 
  47539 __ai __attribute__((target("neon"))) uint64x1_t vcltz_s64(int64x1_t __p0) {
  47540   uint64x1_t __ret;
  47541   __ret = (uint64x1_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 19);
  47542   return __ret;
  47543 }
  47544 #ifdef __LITTLE_ENDIAN__
  47545 __ai __attribute__((target("neon"))) uint16x4_t vcltz_s16(int16x4_t __p0) {
  47546   uint16x4_t __ret;
  47547   __ret = (uint16x4_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 17);
  47548   return __ret;
  47549 }
  47550 #else
  47551 __ai __attribute__((target("neon"))) uint16x4_t vcltz_s16(int16x4_t __p0) {
  47552   uint16x4_t __ret;
  47553   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  47554   __ret = (uint16x4_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 17);
  47555   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  47556   return __ret;
  47557 }
  47558 #endif
  47559 
  47560 __ai __attribute__((target("neon"))) uint64_t vcltzd_s64(int64_t __p0) {
  47561   uint64_t __ret;
  47562   __ret = (uint64_t) __builtin_neon_vcltzd_s64(__p0);
  47563   return __ret;
  47564 }
  47565 __ai __attribute__((target("neon"))) uint64_t vcltzd_f64(float64_t __p0) {
  47566   uint64_t __ret;
  47567   __ret = (uint64_t) __builtin_neon_vcltzd_f64(__p0);
  47568   return __ret;
  47569 }
  47570 __ai __attribute__((target("neon"))) uint32_t vcltzs_f32(float32_t __p0) {
  47571   uint32_t __ret;
  47572   __ret = (uint32_t) __builtin_neon_vcltzs_f32(__p0);
  47573   return __ret;
  47574 }
  47575 #ifdef __LITTLE_ENDIAN__
  47576 __ai __attribute__((target("neon"))) poly64x2_t vcombine_p64(poly64x1_t __p0, poly64x1_t __p1) {
  47577   poly64x2_t __ret;
  47578   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
  47579   return __ret;
  47580 }
  47581 #else
  47582 __ai __attribute__((target("neon"))) poly64x2_t vcombine_p64(poly64x1_t __p0, poly64x1_t __p1) {
  47583   poly64x2_t __ret;
  47584   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
  47585   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47586   return __ret;
  47587 }
  47588 #endif
  47589 
  47590 #ifdef __LITTLE_ENDIAN__
  47591 __ai __attribute__((target("neon"))) float64x2_t vcombine_f64(float64x1_t __p0, float64x1_t __p1) {
  47592   float64x2_t __ret;
  47593   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
  47594   return __ret;
  47595 }
  47596 #else
  47597 __ai __attribute__((target("neon"))) float64x2_t vcombine_f64(float64x1_t __p0, float64x1_t __p1) {
  47598   float64x2_t __ret;
  47599   __ret = __builtin_shufflevector(__p0, __p1, 0, 1);
  47600   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  47601   return __ret;
  47602 }
  47603 #endif
  47604 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_p8(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the poly8x8_t `src` with vget_lane_p8 and writes it
 * into lane `dst_lane` of the poly8x16_t `dst` with vsetq_lane_p8; the value
 * of the expression is the updated poly8x16_t. The two vector arguments are
 * copied into locals first; the lane arguments are pasted into the helper
 * calls as written.
 * NOTE(review): the lane arguments presumably must be constant expressions --
 * confirm against vget_lane_p8 / vsetq_lane_p8. */
#define vcopyq_lane_p8(__p0_278, __p1_278, __p2_278, __p3_278) __extension__ ({ \
  poly8x16_t __ret_278; \
  poly8x16_t __s0_278 = __p0_278; \
  poly8x8_t __s2_278 = __p2_278; \
  __ret_278 = vsetq_lane_p8(vget_lane_p8(__s2_278, __p3_278), __s0_278, __p1_278); \
  __ret_278; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: both vectors are
 * lane-reversed, the copy is done with the __noswap_ helpers, and the result
 * is lane-reversed again before being yielded. */
#define vcopyq_lane_p8(__p0_279, __p1_279, __p2_279, __p3_279) __extension__ ({ \
  poly8x16_t __ret_279; \
  poly8x16_t __s0_279 = __p0_279; \
  poly8x8_t __s2_279 = __p2_279; \
  poly8x16_t __rev0_279;  __rev0_279 = __builtin_shufflevector(__s0_279, __s0_279, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  poly8x8_t __rev2_279;  __rev2_279 = __builtin_shufflevector(__s2_279, __s2_279, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_279 = __noswap_vsetq_lane_p8(__noswap_vget_lane_p8(__rev2_279, __p3_279), __rev0_279, __p1_279); \
  __ret_279 = __builtin_shufflevector(__ret_279, __ret_279, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_279; \
})
#endif
  47625 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_p16(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the poly16x4_t `src` with vget_lane_p16 and writes
 * it into lane `dst_lane` of the poly16x8_t `dst` with vsetq_lane_p16; the
 * value of the expression is the updated poly16x8_t. The two vector arguments
 * are copied into locals first; the lane arguments are pasted into the helper
 * calls as written. */
#define vcopyq_lane_p16(__p0_280, __p1_280, __p2_280, __p3_280) __extension__ ({ \
  poly16x8_t __ret_280; \
  poly16x8_t __s0_280 = __p0_280; \
  poly16x4_t __s2_280 = __p2_280; \
  __ret_280 = vsetq_lane_p16(vget_lane_p16(__s2_280, __p3_280), __s0_280, __p1_280); \
  __ret_280; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: both vectors are
 * lane-reversed, the copy is done with the __noswap_ helpers, and the result
 * is lane-reversed again before being yielded. */
#define vcopyq_lane_p16(__p0_281, __p1_281, __p2_281, __p3_281) __extension__ ({ \
  poly16x8_t __ret_281; \
  poly16x8_t __s0_281 = __p0_281; \
  poly16x4_t __s2_281 = __p2_281; \
  poly16x8_t __rev0_281;  __rev0_281 = __builtin_shufflevector(__s0_281, __s0_281, 7, 6, 5, 4, 3, 2, 1, 0); \
  poly16x4_t __rev2_281;  __rev2_281 = __builtin_shufflevector(__s2_281, __s2_281, 3, 2, 1, 0); \
  __ret_281 = __noswap_vsetq_lane_p16(__noswap_vget_lane_p16(__rev2_281, __p3_281), __rev0_281, __p1_281); \
  __ret_281 = __builtin_shufflevector(__ret_281, __ret_281, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_281; \
})
#endif
  47646 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_u8(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the uint8x8_t `src` with vget_lane_u8 and writes it
 * into lane `dst_lane` of the uint8x16_t `dst` with vsetq_lane_u8; the value
 * of the expression is the updated uint8x16_t. The two vector arguments are
 * copied into locals first; the lane arguments are pasted into the helper
 * calls as written. */
#define vcopyq_lane_u8(__p0_282, __p1_282, __p2_282, __p3_282) __extension__ ({ \
  uint8x16_t __ret_282; \
  uint8x16_t __s0_282 = __p0_282; \
  uint8x8_t __s2_282 = __p2_282; \
  __ret_282 = vsetq_lane_u8(vget_lane_u8(__s2_282, __p3_282), __s0_282, __p1_282); \
  __ret_282; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: both vectors are
 * lane-reversed, the copy is done with the __noswap_ helpers, and the result
 * is lane-reversed again before being yielded. */
#define vcopyq_lane_u8(__p0_283, __p1_283, __p2_283, __p3_283) __extension__ ({ \
  uint8x16_t __ret_283; \
  uint8x16_t __s0_283 = __p0_283; \
  uint8x8_t __s2_283 = __p2_283; \
  uint8x16_t __rev0_283;  __rev0_283 = __builtin_shufflevector(__s0_283, __s0_283, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint8x8_t __rev2_283;  __rev2_283 = __builtin_shufflevector(__s2_283, __s2_283, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_283 = __noswap_vsetq_lane_u8(__noswap_vget_lane_u8(__rev2_283, __p3_283), __rev0_283, __p1_283); \
  __ret_283 = __builtin_shufflevector(__ret_283, __ret_283, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_283; \
})
#endif
  47667 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_u32(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the uint32x2_t `src` with vget_lane_u32 and writes
 * it into lane `dst_lane` of the uint32x4_t `dst` with vsetq_lane_u32; the
 * value of the expression is the updated uint32x4_t. The two vector arguments
 * are copied into locals first; the lane arguments are pasted into the helper
 * calls as written. */
#define vcopyq_lane_u32(__p0_284, __p1_284, __p2_284, __p3_284) __extension__ ({ \
  uint32x4_t __ret_284; \
  uint32x4_t __s0_284 = __p0_284; \
  uint32x2_t __s2_284 = __p2_284; \
  __ret_284 = vsetq_lane_u32(vget_lane_u32(__s2_284, __p3_284), __s0_284, __p1_284); \
  __ret_284; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: both vectors are
 * lane-reversed, the copy is done with the __noswap_ helpers, and the result
 * is lane-reversed again before being yielded. */
#define vcopyq_lane_u32(__p0_285, __p1_285, __p2_285, __p3_285) __extension__ ({ \
  uint32x4_t __ret_285; \
  uint32x4_t __s0_285 = __p0_285; \
  uint32x2_t __s2_285 = __p2_285; \
  uint32x4_t __rev0_285;  __rev0_285 = __builtin_shufflevector(__s0_285, __s0_285, 3, 2, 1, 0); \
  uint32x2_t __rev2_285;  __rev2_285 = __builtin_shufflevector(__s2_285, __s2_285, 1, 0); \
  __ret_285 = __noswap_vsetq_lane_u32(__noswap_vget_lane_u32(__rev2_285, __p3_285), __rev0_285, __p1_285); \
  __ret_285 = __builtin_shufflevector(__ret_285, __ret_285, 3, 2, 1, 0); \
  __ret_285; \
})
#endif
  47688 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_u64(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the uint64x1_t `src` with vget_lane_u64 and writes
 * it into lane `dst_lane` of the uint64x2_t `dst` with vsetq_lane_u64; the
 * value of the expression is the updated uint64x2_t. The two vector arguments
 * are copied into locals first; the lane arguments are pasted into the helper
 * calls as written. */
#define vcopyq_lane_u64(__p0_286, __p1_286, __p2_286, __p3_286) __extension__ ({ \
  uint64x2_t __ret_286; \
  uint64x2_t __s0_286 = __p0_286; \
  uint64x1_t __s2_286 = __p2_286; \
  __ret_286 = vsetq_lane_u64(vget_lane_u64(__s2_286, __p3_286), __s0_286, __p1_286); \
  __ret_286; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: only the two-lane
 * destination is lane-reversed (the single-lane source is read with the plain
 * vget_lane_u64), the store uses __noswap_vsetq_lane_u64, and the result is
 * lane-reversed again before being yielded. */
#define vcopyq_lane_u64(__p0_287, __p1_287, __p2_287, __p3_287) __extension__ ({ \
  uint64x2_t __ret_287; \
  uint64x2_t __s0_287 = __p0_287; \
  uint64x1_t __s2_287 = __p2_287; \
  uint64x2_t __rev0_287;  __rev0_287 = __builtin_shufflevector(__s0_287, __s0_287, 1, 0); \
  __ret_287 = __noswap_vsetq_lane_u64(vget_lane_u64(__s2_287, __p3_287), __rev0_287, __p1_287); \
  __ret_287 = __builtin_shufflevector(__ret_287, __ret_287, 1, 0); \
  __ret_287; \
})
#endif
  47708 
#ifdef __LITTLE_ENDIAN__
/* vcopyq_lane_u16(dst, dst_lane, src, src_lane): statement-expression macro.
 * Reads lane `src_lane` of the uint16x4_t `src` with vget_lane_u16 and writes
 * it into lane `dst_lane` of the uint16x8_t `dst` with vsetq_lane_u16; the
 * value of the expression is the updated uint16x8_t. The two vector arguments
 * are copied into locals first; the lane arguments are pasted into the helper
 * calls as written. */
#define vcopyq_lane_u16(__p0_288, __p1_288, __p2_288, __p3_288) __extension__ ({ \
  uint16x8_t __ret_288; \
  uint16x8_t __s0_288 = __p0_288; \
  uint16x4_t __s2_288 = __p2_288; \
  __ret_288 = vsetq_lane_u16(vget_lane_u16(__s2_288, __p3_288), __s0_288, __p1_288); \
  __ret_288; \
})
#else
/* Variant for when __LITTLE_ENDIAN__ is not defined: both vectors are
 * lane-reversed, the copy is done with the __noswap_ helpers, and the result
 * is lane-reversed again before being yielded. */
#define vcopyq_lane_u16(__p0_289, __p1_289, __p2_289, __p3_289) __extension__ ({ \
  uint16x8_t __ret_289; \
  uint16x8_t __s0_289 = __p0_289; \
  uint16x4_t __s2_289 = __p2_289; \
  uint16x8_t __rev0_289;  __rev0_289 = __builtin_shufflevector(__s0_289, __s0_289, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint16x4_t __rev2_289;  __rev2_289 = __builtin_shufflevector(__s2_289, __s2_289, 3, 2, 1, 0); \
  __ret_289 = __noswap_vsetq_lane_u16(__noswap_vget_lane_u16(__rev2_289, __p3_289), __rev0_289, __p1_289); \
  __ret_289 = __builtin_shufflevector(__ret_289, __ret_289, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret_289; \
})
#endif
  47729 
  47730 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_s8(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s8(vget_lane_s8(__p2, __p3), __p0, __p1), with __p0 bound to an
         * int8x16_t local and __p2 to an int8x8_t local; yields an int8x16_t. */
  47731 #define vcopyq_lane_s8(__p0_290, __p1_290, __p2_290, __p3_290) __extension__ ({ \
  47732   int8x16_t __ret_290; \
  47733   int8x16_t __s0_290 = __p0_290; \
  47734   int8x8_t __s2_290 = __p2_290; \
  47735   __ret_290 = vsetq_lane_s8(vget_lane_s8(__s2_290, __p3_290), __s0_290, __p1_290); \
  47736   __ret_290; \
  47737 })
  47738 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47739 #define vcopyq_lane_s8(__p0_291, __p1_291, __p2_291, __p3_291) __extension__ ({ \
  47740   int8x16_t __ret_291; \
  47741   int8x16_t __s0_291 = __p0_291; \
  47742   int8x8_t __s2_291 = __p2_291; \
  47743   int8x16_t __rev0_291;  __rev0_291 = __builtin_shufflevector(__s0_291, __s0_291, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  47744   int8x8_t __rev2_291;  __rev2_291 = __builtin_shufflevector(__s2_291, __s2_291, 7, 6, 5, 4, 3, 2, 1, 0); \
  47745   __ret_291 = __noswap_vsetq_lane_s8(__noswap_vget_lane_s8(__rev2_291, __p3_291), __rev0_291, __p1_291); \
  47746   __ret_291 = __builtin_shufflevector(__ret_291, __ret_291, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  47747   __ret_291; \
  47748 })
  47749 #endif
  47750 
  47751 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_f32(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_f32(vget_lane_f32(__p2, __p3), __p0, __p1), with __p0 bound to a
         * float32x4_t local and __p2 to a float32x2_t local; yields a float32x4_t. */
  47752 #define vcopyq_lane_f32(__p0_292, __p1_292, __p2_292, __p3_292) __extension__ ({ \
  47753   float32x4_t __ret_292; \
  47754   float32x4_t __s0_292 = __p0_292; \
  47755   float32x2_t __s2_292 = __p2_292; \
  47756   __ret_292 = vsetq_lane_f32(vget_lane_f32(__s2_292, __p3_292), __s0_292, __p1_292); \
  47757   __ret_292; \
  47758 })
  47759 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47760 #define vcopyq_lane_f32(__p0_293, __p1_293, __p2_293, __p3_293) __extension__ ({ \
  47761   float32x4_t __ret_293; \
  47762   float32x4_t __s0_293 = __p0_293; \
  47763   float32x2_t __s2_293 = __p2_293; \
  47764   float32x4_t __rev0_293;  __rev0_293 = __builtin_shufflevector(__s0_293, __s0_293, 3, 2, 1, 0); \
  47765   float32x2_t __rev2_293;  __rev2_293 = __builtin_shufflevector(__s2_293, __s2_293, 1, 0); \
  47766   __ret_293 = __noswap_vsetq_lane_f32(__noswap_vget_lane_f32(__rev2_293, __p3_293), __rev0_293, __p1_293); \
  47767   __ret_293 = __builtin_shufflevector(__ret_293, __ret_293, 3, 2, 1, 0); \
  47768   __ret_293; \
  47769 })
  47770 #endif
  47771 
  47772 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_s32(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s32(vget_lane_s32(__p2, __p3), __p0, __p1), with __p0 bound to an
         * int32x4_t local and __p2 to an int32x2_t local; yields an int32x4_t. */
  47773 #define vcopyq_lane_s32(__p0_294, __p1_294, __p2_294, __p3_294) __extension__ ({ \
  47774   int32x4_t __ret_294; \
  47775   int32x4_t __s0_294 = __p0_294; \
  47776   int32x2_t __s2_294 = __p2_294; \
  47777   __ret_294 = vsetq_lane_s32(vget_lane_s32(__s2_294, __p3_294), __s0_294, __p1_294); \
  47778   __ret_294; \
  47779 })
  47780 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47781 #define vcopyq_lane_s32(__p0_295, __p1_295, __p2_295, __p3_295) __extension__ ({ \
  47782   int32x4_t __ret_295; \
  47783   int32x4_t __s0_295 = __p0_295; \
  47784   int32x2_t __s2_295 = __p2_295; \
  47785   int32x4_t __rev0_295;  __rev0_295 = __builtin_shufflevector(__s0_295, __s0_295, 3, 2, 1, 0); \
  47786   int32x2_t __rev2_295;  __rev2_295 = __builtin_shufflevector(__s2_295, __s2_295, 1, 0); \
  47787   __ret_295 = __noswap_vsetq_lane_s32(__noswap_vget_lane_s32(__rev2_295, __p3_295), __rev0_295, __p1_295); \
  47788   __ret_295 = __builtin_shufflevector(__ret_295, __ret_295, 3, 2, 1, 0); \
  47789   __ret_295; \
  47790 })
  47791 #endif
  47792 
  47793 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_s64(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s64(vget_lane_s64(__p2, __p3), __p0, __p1), with __p0 bound to an
         * int64x2_t local and __p2 to an int64x1_t local; yields an int64x2_t. */
  47794 #define vcopyq_lane_s64(__p0_296, __p1_296, __p2_296, __p3_296) __extension__ ({ \
  47795   int64x2_t __ret_296; \
  47796   int64x2_t __s0_296 = __p0_296; \
  47797   int64x1_t __s2_296 = __p2_296; \
  47798   __ret_296 = vsetq_lane_s64(vget_lane_s64(__s2_296, __p3_296), __s0_296, __p1_296); \
  47799   __ret_296; \
  47800 })
  47801 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 is element-reversed with
         * __builtin_shufflevector, __noswap_vsetq_lane_s64 runs on the reversed copy,
         * and the result is reversed back. __p2 (int64x1_t) is read unreversed. */
  47802 #define vcopyq_lane_s64(__p0_297, __p1_297, __p2_297, __p3_297) __extension__ ({ \
  47803   int64x2_t __ret_297; \
  47804   int64x2_t __s0_297 = __p0_297; \
  47805   int64x1_t __s2_297 = __p2_297; \
  47806   int64x2_t __rev0_297;  __rev0_297 = __builtin_shufflevector(__s0_297, __s0_297, 1, 0); \
  47807   __ret_297 = __noswap_vsetq_lane_s64(vget_lane_s64(__s2_297, __p3_297), __rev0_297, __p1_297); \
  47808   __ret_297 = __builtin_shufflevector(__ret_297, __ret_297, 1, 0); \
  47809   __ret_297; \
  47810 })
  47811 #endif
  47812 
  47813 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_lane_s16(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s16(vget_lane_s16(__p2, __p3), __p0, __p1), with __p0 bound to an
         * int16x8_t local and __p2 to an int16x4_t local; yields an int16x8_t. */
  47814 #define vcopyq_lane_s16(__p0_298, __p1_298, __p2_298, __p3_298) __extension__ ({ \
  47815   int16x8_t __ret_298; \
  47816   int16x8_t __s0_298 = __p0_298; \
  47817   int16x4_t __s2_298 = __p2_298; \
  47818   __ret_298 = vsetq_lane_s16(vget_lane_s16(__s2_298, __p3_298), __s0_298, __p1_298); \
  47819   __ret_298; \
  47820 })
  47821 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47822 #define vcopyq_lane_s16(__p0_299, __p1_299, __p2_299, __p3_299) __extension__ ({ \
  47823   int16x8_t __ret_299; \
  47824   int16x8_t __s0_299 = __p0_299; \
  47825   int16x4_t __s2_299 = __p2_299; \
  47826   int16x8_t __rev0_299;  __rev0_299 = __builtin_shufflevector(__s0_299, __s0_299, 7, 6, 5, 4, 3, 2, 1, 0); \
  47827   int16x4_t __rev2_299;  __rev2_299 = __builtin_shufflevector(__s2_299, __s2_299, 3, 2, 1, 0); \
  47828   __ret_299 = __noswap_vsetq_lane_s16(__noswap_vget_lane_s16(__rev2_299, __p3_299), __rev0_299, __p1_299); \
  47829   __ret_299 = __builtin_shufflevector(__ret_299, __ret_299, 7, 6, 5, 4, 3, 2, 1, 0); \
  47830   __ret_299; \
  47831 })
  47832 #endif
  47833 
  47834 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_p8(__p0, __p1, __p2, __p3): expands to
         * vset_lane_p8(vget_lane_p8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a poly8x8_t local; yields a poly8x8_t. */
  47835 #define vcopy_lane_p8(__p0_300, __p1_300, __p2_300, __p3_300) __extension__ ({ \
  47836   poly8x8_t __ret_300; \
  47837   poly8x8_t __s0_300 = __p0_300; \
  47838   poly8x8_t __s2_300 = __p2_300; \
  47839   __ret_300 = vset_lane_p8(vget_lane_p8(__s2_300, __p3_300), __s0_300, __p1_300); \
  47840   __ret_300; \
  47841 })
  47842 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47843 #define vcopy_lane_p8(__p0_301, __p1_301, __p2_301, __p3_301) __extension__ ({ \
  47844   poly8x8_t __ret_301; \
  47845   poly8x8_t __s0_301 = __p0_301; \
  47846   poly8x8_t __s2_301 = __p2_301; \
  47847   poly8x8_t __rev0_301;  __rev0_301 = __builtin_shufflevector(__s0_301, __s0_301, 7, 6, 5, 4, 3, 2, 1, 0); \
  47848   poly8x8_t __rev2_301;  __rev2_301 = __builtin_shufflevector(__s2_301, __s2_301, 7, 6, 5, 4, 3, 2, 1, 0); \
  47849   __ret_301 = __noswap_vset_lane_p8(__noswap_vget_lane_p8(__rev2_301, __p3_301), __rev0_301, __p1_301); \
  47850   __ret_301 = __builtin_shufflevector(__ret_301, __ret_301, 7, 6, 5, 4, 3, 2, 1, 0); \
  47851   __ret_301; \
  47852 })
  47853 #endif
  47854 
  47855 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_p16(__p0, __p1, __p2, __p3): expands to
         * vset_lane_p16(vget_lane_p16(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a poly16x4_t local; yields a poly16x4_t. */
  47856 #define vcopy_lane_p16(__p0_302, __p1_302, __p2_302, __p3_302) __extension__ ({ \
  47857   poly16x4_t __ret_302; \
  47858   poly16x4_t __s0_302 = __p0_302; \
  47859   poly16x4_t __s2_302 = __p2_302; \
  47860   __ret_302 = vset_lane_p16(vget_lane_p16(__s2_302, __p3_302), __s0_302, __p1_302); \
  47861   __ret_302; \
  47862 })
  47863 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47864 #define vcopy_lane_p16(__p0_303, __p1_303, __p2_303, __p3_303) __extension__ ({ \
  47865   poly16x4_t __ret_303; \
  47866   poly16x4_t __s0_303 = __p0_303; \
  47867   poly16x4_t __s2_303 = __p2_303; \
  47868   poly16x4_t __rev0_303;  __rev0_303 = __builtin_shufflevector(__s0_303, __s0_303, 3, 2, 1, 0); \
  47869   poly16x4_t __rev2_303;  __rev2_303 = __builtin_shufflevector(__s2_303, __s2_303, 3, 2, 1, 0); \
  47870   __ret_303 = __noswap_vset_lane_p16(__noswap_vget_lane_p16(__rev2_303, __p3_303), __rev0_303, __p1_303); \
  47871   __ret_303 = __builtin_shufflevector(__ret_303, __ret_303, 3, 2, 1, 0); \
  47872   __ret_303; \
  47873 })
  47874 #endif
  47875 
  47876 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_u8(__p0, __p1, __p2, __p3): expands to
         * vset_lane_u8(vget_lane_u8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a uint8x8_t local; yields a uint8x8_t. */
  47877 #define vcopy_lane_u8(__p0_304, __p1_304, __p2_304, __p3_304) __extension__ ({ \
  47878   uint8x8_t __ret_304; \
  47879   uint8x8_t __s0_304 = __p0_304; \
  47880   uint8x8_t __s2_304 = __p2_304; \
  47881   __ret_304 = vset_lane_u8(vget_lane_u8(__s2_304, __p3_304), __s0_304, __p1_304); \
  47882   __ret_304; \
  47883 })
  47884 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47885 #define vcopy_lane_u8(__p0_305, __p1_305, __p2_305, __p3_305) __extension__ ({ \
  47886   uint8x8_t __ret_305; \
  47887   uint8x8_t __s0_305 = __p0_305; \
  47888   uint8x8_t __s2_305 = __p2_305; \
  47889   uint8x8_t __rev0_305;  __rev0_305 = __builtin_shufflevector(__s0_305, __s0_305, 7, 6, 5, 4, 3, 2, 1, 0); \
  47890   uint8x8_t __rev2_305;  __rev2_305 = __builtin_shufflevector(__s2_305, __s2_305, 7, 6, 5, 4, 3, 2, 1, 0); \
  47891   __ret_305 = __noswap_vset_lane_u8(__noswap_vget_lane_u8(__rev2_305, __p3_305), __rev0_305, __p1_305); \
  47892   __ret_305 = __builtin_shufflevector(__ret_305, __ret_305, 7, 6, 5, 4, 3, 2, 1, 0); \
  47893   __ret_305; \
  47894 })
  47895 #endif
  47896 
  47897 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_u32(__p0, __p1, __p2, __p3): expands to
         * vset_lane_u32(vget_lane_u32(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a uint32x2_t local; yields a uint32x2_t. */
  47898 #define vcopy_lane_u32(__p0_306, __p1_306, __p2_306, __p3_306) __extension__ ({ \
  47899   uint32x2_t __ret_306; \
  47900   uint32x2_t __s0_306 = __p0_306; \
  47901   uint32x2_t __s2_306 = __p2_306; \
  47902   __ret_306 = vset_lane_u32(vget_lane_u32(__s2_306, __p3_306), __s0_306, __p1_306); \
  47903   __ret_306; \
  47904 })
  47905 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47906 #define vcopy_lane_u32(__p0_307, __p1_307, __p2_307, __p3_307) __extension__ ({ \
  47907   uint32x2_t __ret_307; \
  47908   uint32x2_t __s0_307 = __p0_307; \
  47909   uint32x2_t __s2_307 = __p2_307; \
  47910   uint32x2_t __rev0_307;  __rev0_307 = __builtin_shufflevector(__s0_307, __s0_307, 1, 0); \
  47911   uint32x2_t __rev2_307;  __rev2_307 = __builtin_shufflevector(__s2_307, __s2_307, 1, 0); \
  47912   __ret_307 = __noswap_vset_lane_u32(__noswap_vget_lane_u32(__rev2_307, __p3_307), __rev0_307, __p1_307); \
  47913   __ret_307 = __builtin_shufflevector(__ret_307, __ret_307, 1, 0); \
  47914   __ret_307; \
  47915 })
  47916 #endif
  47917 
  /* vcopy_lane_u64(__p0, __p1, __p2, __p3): expands to
   * vset_lane_u64(vget_lane_u64(__p2, __p3), __p0, __p1), with __p0 and __p2 each
   * bound to a uint64x1_t local; yields a uint64x1_t. This macro has a single
   * definition, not a __LITTLE_ENDIAN__ #ifdef/#else pair, and does no shuffling. */
  47918 #define vcopy_lane_u64(__p0_308, __p1_308, __p2_308, __p3_308) __extension__ ({ \
  47919   uint64x1_t __ret_308; \
  47920   uint64x1_t __s0_308 = __p0_308; \
  47921   uint64x1_t __s2_308 = __p2_308; \
  47922   __ret_308 = vset_lane_u64(vget_lane_u64(__s2_308, __p3_308), __s0_308, __p1_308); \
  47923   __ret_308; \
  47924 })
  47925 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_u16(__p0, __p1, __p2, __p3): expands to
         * vset_lane_u16(vget_lane_u16(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a uint16x4_t local; yields a uint16x4_t. */
  47926 #define vcopy_lane_u16(__p0_309, __p1_309, __p2_309, __p3_309) __extension__ ({ \
  47927   uint16x4_t __ret_309; \
  47928   uint16x4_t __s0_309 = __p0_309; \
  47929   uint16x4_t __s2_309 = __p2_309; \
  47930   __ret_309 = vset_lane_u16(vget_lane_u16(__s2_309, __p3_309), __s0_309, __p1_309); \
  47931   __ret_309; \
  47932 })
  47933 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47934 #define vcopy_lane_u16(__p0_310, __p1_310, __p2_310, __p3_310) __extension__ ({ \
  47935   uint16x4_t __ret_310; \
  47936   uint16x4_t __s0_310 = __p0_310; \
  47937   uint16x4_t __s2_310 = __p2_310; \
  47938   uint16x4_t __rev0_310;  __rev0_310 = __builtin_shufflevector(__s0_310, __s0_310, 3, 2, 1, 0); \
  47939   uint16x4_t __rev2_310;  __rev2_310 = __builtin_shufflevector(__s2_310, __s2_310, 3, 2, 1, 0); \
  47940   __ret_310 = __noswap_vset_lane_u16(__noswap_vget_lane_u16(__rev2_310, __p3_310), __rev0_310, __p1_310); \
  47941   __ret_310 = __builtin_shufflevector(__ret_310, __ret_310, 3, 2, 1, 0); \
  47942   __ret_310; \
  47943 })
  47944 #endif
  47945 
  47946 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_s8(__p0, __p1, __p2, __p3): expands to
         * vset_lane_s8(vget_lane_s8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to an int8x8_t local; yields an int8x8_t. */
  47947 #define vcopy_lane_s8(__p0_311, __p1_311, __p2_311, __p3_311) __extension__ ({ \
  47948   int8x8_t __ret_311; \
  47949   int8x8_t __s0_311 = __p0_311; \
  47950   int8x8_t __s2_311 = __p2_311; \
  47951   __ret_311 = vset_lane_s8(vget_lane_s8(__s2_311, __p3_311), __s0_311, __p1_311); \
  47952   __ret_311; \
  47953 })
  47954 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47955 #define vcopy_lane_s8(__p0_312, __p1_312, __p2_312, __p3_312) __extension__ ({ \
  47956   int8x8_t __ret_312; \
  47957   int8x8_t __s0_312 = __p0_312; \
  47958   int8x8_t __s2_312 = __p2_312; \
  47959   int8x8_t __rev0_312;  __rev0_312 = __builtin_shufflevector(__s0_312, __s0_312, 7, 6, 5, 4, 3, 2, 1, 0); \
  47960   int8x8_t __rev2_312;  __rev2_312 = __builtin_shufflevector(__s2_312, __s2_312, 7, 6, 5, 4, 3, 2, 1, 0); \
  47961   __ret_312 = __noswap_vset_lane_s8(__noswap_vget_lane_s8(__rev2_312, __p3_312), __rev0_312, __p1_312); \
  47962   __ret_312 = __builtin_shufflevector(__ret_312, __ret_312, 7, 6, 5, 4, 3, 2, 1, 0); \
  47963   __ret_312; \
  47964 })
  47965 #endif
  47966 
  47967 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_f32(__p0, __p1, __p2, __p3): expands to
         * vset_lane_f32(vget_lane_f32(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a float32x2_t local; yields a float32x2_t. */
  47968 #define vcopy_lane_f32(__p0_313, __p1_313, __p2_313, __p3_313) __extension__ ({ \
  47969   float32x2_t __ret_313; \
  47970   float32x2_t __s0_313 = __p0_313; \
  47971   float32x2_t __s2_313 = __p2_313; \
  47972   __ret_313 = vset_lane_f32(vget_lane_f32(__s2_313, __p3_313), __s0_313, __p1_313); \
  47973   __ret_313; \
  47974 })
  47975 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47976 #define vcopy_lane_f32(__p0_314, __p1_314, __p2_314, __p3_314) __extension__ ({ \
  47977   float32x2_t __ret_314; \
  47978   float32x2_t __s0_314 = __p0_314; \
  47979   float32x2_t __s2_314 = __p2_314; \
  47980   float32x2_t __rev0_314;  __rev0_314 = __builtin_shufflevector(__s0_314, __s0_314, 1, 0); \
  47981   float32x2_t __rev2_314;  __rev2_314 = __builtin_shufflevector(__s2_314, __s2_314, 1, 0); \
  47982   __ret_314 = __noswap_vset_lane_f32(__noswap_vget_lane_f32(__rev2_314, __p3_314), __rev0_314, __p1_314); \
  47983   __ret_314 = __builtin_shufflevector(__ret_314, __ret_314, 1, 0); \
  47984   __ret_314; \
  47985 })
  47986 #endif
  47987 
  47988 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_s32(__p0, __p1, __p2, __p3): expands to
         * vset_lane_s32(vget_lane_s32(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to an int32x2_t local; yields an int32x2_t. */
  47989 #define vcopy_lane_s32(__p0_315, __p1_315, __p2_315, __p3_315) __extension__ ({ \
  47990   int32x2_t __ret_315; \
  47991   int32x2_t __s0_315 = __p0_315; \
  47992   int32x2_t __s2_315 = __p2_315; \
  47993   __ret_315 = vset_lane_s32(vget_lane_s32(__s2_315, __p3_315), __s0_315, __p1_315); \
  47994   __ret_315; \
  47995 })
  47996 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  47997 #define vcopy_lane_s32(__p0_316, __p1_316, __p2_316, __p3_316) __extension__ ({ \
  47998   int32x2_t __ret_316; \
  47999   int32x2_t __s0_316 = __p0_316; \
  48000   int32x2_t __s2_316 = __p2_316; \
  48001   int32x2_t __rev0_316;  __rev0_316 = __builtin_shufflevector(__s0_316, __s0_316, 1, 0); \
  48002   int32x2_t __rev2_316;  __rev2_316 = __builtin_shufflevector(__s2_316, __s2_316, 1, 0); \
  48003   __ret_316 = __noswap_vset_lane_s32(__noswap_vget_lane_s32(__rev2_316, __p3_316), __rev0_316, __p1_316); \
  48004   __ret_316 = __builtin_shufflevector(__ret_316, __ret_316, 1, 0); \
  48005   __ret_316; \
  48006 })
  48007 #endif
  48008 
  /* vcopy_lane_s64(__p0, __p1, __p2, __p3): expands to
   * vset_lane_s64(vget_lane_s64(__p2, __p3), __p0, __p1), with __p0 and __p2 each
   * bound to an int64x1_t local; yields an int64x1_t. This macro has a single
   * definition, not a __LITTLE_ENDIAN__ #ifdef/#else pair, and does no shuffling. */
  48009 #define vcopy_lane_s64(__p0_317, __p1_317, __p2_317, __p3_317) __extension__ ({ \
  48010   int64x1_t __ret_317; \
  48011   int64x1_t __s0_317 = __p0_317; \
  48012   int64x1_t __s2_317 = __p2_317; \
  48013   __ret_317 = vset_lane_s64(vget_lane_s64(__s2_317, __p3_317), __s0_317, __p1_317); \
  48014   __ret_317; \
  48015 })
  48016 #ifdef __LITTLE_ENDIAN__
        /* vcopy_lane_s16(__p0, __p1, __p2, __p3): expands to
         * vset_lane_s16(vget_lane_s16(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to an int16x4_t local; yields an int16x4_t. */
  48017 #define vcopy_lane_s16(__p0_318, __p1_318, __p2_318, __p3_318) __extension__ ({ \
  48018   int16x4_t __ret_318; \
  48019   int16x4_t __s0_318 = __p0_318; \
  48020   int16x4_t __s2_318 = __p2_318; \
  48021   __ret_318 = vset_lane_s16(vget_lane_s16(__s2_318, __p3_318), __s0_318, __p1_318); \
  48022   __ret_318; \
  48023 })
  48024 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48025 #define vcopy_lane_s16(__p0_319, __p1_319, __p2_319, __p3_319) __extension__ ({ \
  48026   int16x4_t __ret_319; \
  48027   int16x4_t __s0_319 = __p0_319; \
  48028   int16x4_t __s2_319 = __p2_319; \
  48029   int16x4_t __rev0_319;  __rev0_319 = __builtin_shufflevector(__s0_319, __s0_319, 3, 2, 1, 0); \
  48030   int16x4_t __rev2_319;  __rev2_319 = __builtin_shufflevector(__s2_319, __s2_319, 3, 2, 1, 0); \
  48031   __ret_319 = __noswap_vset_lane_s16(__noswap_vget_lane_s16(__rev2_319, __p3_319), __rev0_319, __p1_319); \
  48032   __ret_319 = __builtin_shufflevector(__ret_319, __ret_319, 3, 2, 1, 0); \
  48033   __ret_319; \
  48034 })
  48035 #endif
  48036 
  48037 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_p8(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_p8(vgetq_lane_p8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a poly8x16_t local; yields a poly8x16_t. */
  48038 #define vcopyq_laneq_p8(__p0_320, __p1_320, __p2_320, __p3_320) __extension__ ({ \
  48039   poly8x16_t __ret_320; \
  48040   poly8x16_t __s0_320 = __p0_320; \
  48041   poly8x16_t __s2_320 = __p2_320; \
  48042   __ret_320 = vsetq_lane_p8(vgetq_lane_p8(__s2_320, __p3_320), __s0_320, __p1_320); \
  48043   __ret_320; \
  48044 })
  48045 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48046 #define vcopyq_laneq_p8(__p0_321, __p1_321, __p2_321, __p3_321) __extension__ ({ \
  48047   poly8x16_t __ret_321; \
  48048   poly8x16_t __s0_321 = __p0_321; \
  48049   poly8x16_t __s2_321 = __p2_321; \
  48050   poly8x16_t __rev0_321;  __rev0_321 = __builtin_shufflevector(__s0_321, __s0_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48051   poly8x16_t __rev2_321;  __rev2_321 = __builtin_shufflevector(__s2_321, __s2_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48052   __ret_321 = __noswap_vsetq_lane_p8(__noswap_vgetq_lane_p8(__rev2_321, __p3_321), __rev0_321, __p1_321); \
  48053   __ret_321 = __builtin_shufflevector(__ret_321, __ret_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48054   __ret_321; \
  48055 })
  48056 #endif
  48057 
  48058 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_p16(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_p16(vgetq_lane_p16(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to a poly16x8_t local; yields a poly16x8_t. */
  48059 #define vcopyq_laneq_p16(__p0_322, __p1_322, __p2_322, __p3_322) __extension__ ({ \
  48060   poly16x8_t __ret_322; \
  48061   poly16x8_t __s0_322 = __p0_322; \
  48062   poly16x8_t __s2_322 = __p2_322; \
  48063   __ret_322 = vsetq_lane_p16(vgetq_lane_p16(__s2_322, __p3_322), __s0_322, __p1_322); \
  48064   __ret_322; \
  48065 })
  48066 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48067 #define vcopyq_laneq_p16(__p0_323, __p1_323, __p2_323, __p3_323) __extension__ ({ \
  48068   poly16x8_t __ret_323; \
  48069   poly16x8_t __s0_323 = __p0_323; \
  48070   poly16x8_t __s2_323 = __p2_323; \
  48071   poly16x8_t __rev0_323;  __rev0_323 = __builtin_shufflevector(__s0_323, __s0_323, 7, 6, 5, 4, 3, 2, 1, 0); \
  48072   poly16x8_t __rev2_323;  __rev2_323 = __builtin_shufflevector(__s2_323, __s2_323, 7, 6, 5, 4, 3, 2, 1, 0); \
  48073   __ret_323 = __noswap_vsetq_lane_p16(__noswap_vgetq_lane_p16(__rev2_323, __p3_323), __rev0_323, __p1_323); \
  48074   __ret_323 = __builtin_shufflevector(__ret_323, __ret_323, 7, 6, 5, 4, 3, 2, 1, 0); \
  48075   __ret_323; \
  48076 })
  48077 #endif
  48078 
  48079 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_u8(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_u8(vgetq_lane_u8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to a uint8x16_t local; yields a uint8x16_t. */
  48080 #define vcopyq_laneq_u8(__p0_324, __p1_324, __p2_324, __p3_324) __extension__ ({ \
  48081   uint8x16_t __ret_324; \
  48082   uint8x16_t __s0_324 = __p0_324; \
  48083   uint8x16_t __s2_324 = __p2_324; \
  48084   __ret_324 = vsetq_lane_u8(vgetq_lane_u8(__s2_324, __p3_324), __s0_324, __p1_324); \
  48085   __ret_324; \
  48086 })
  48087 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48088 #define vcopyq_laneq_u8(__p0_325, __p1_325, __p2_325, __p3_325) __extension__ ({ \
  48089   uint8x16_t __ret_325; \
  48090   uint8x16_t __s0_325 = __p0_325; \
  48091   uint8x16_t __s2_325 = __p2_325; \
  48092   uint8x16_t __rev0_325;  __rev0_325 = __builtin_shufflevector(__s0_325, __s0_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48093   uint8x16_t __rev2_325;  __rev2_325 = __builtin_shufflevector(__s2_325, __s2_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48094   __ret_325 = __noswap_vsetq_lane_u8(__noswap_vgetq_lane_u8(__rev2_325, __p3_325), __rev0_325, __p1_325); \
  48095   __ret_325 = __builtin_shufflevector(__ret_325, __ret_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48096   __ret_325; \
  48097 })
  48098 #endif
  48099 
  48100 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_u32(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_u32(vgetq_lane_u32(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to a uint32x4_t local; yields a uint32x4_t. */
  48101 #define vcopyq_laneq_u32(__p0_326, __p1_326, __p2_326, __p3_326) __extension__ ({ \
  48102   uint32x4_t __ret_326; \
  48103   uint32x4_t __s0_326 = __p0_326; \
  48104   uint32x4_t __s2_326 = __p2_326; \
  48105   __ret_326 = vsetq_lane_u32(vgetq_lane_u32(__s2_326, __p3_326), __s0_326, __p1_326); \
  48106   __ret_326; \
  48107 })
  48108 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48109 #define vcopyq_laneq_u32(__p0_327, __p1_327, __p2_327, __p3_327) __extension__ ({ \
  48110   uint32x4_t __ret_327; \
  48111   uint32x4_t __s0_327 = __p0_327; \
  48112   uint32x4_t __s2_327 = __p2_327; \
  48113   uint32x4_t __rev0_327;  __rev0_327 = __builtin_shufflevector(__s0_327, __s0_327, 3, 2, 1, 0); \
  48114   uint32x4_t __rev2_327;  __rev2_327 = __builtin_shufflevector(__s2_327, __s2_327, 3, 2, 1, 0); \
  48115   __ret_327 = __noswap_vsetq_lane_u32(__noswap_vgetq_lane_u32(__rev2_327, __p3_327), __rev0_327, __p1_327); \
  48116   __ret_327 = __builtin_shufflevector(__ret_327, __ret_327, 3, 2, 1, 0); \
  48117   __ret_327; \
  48118 })
  48119 #endif
  48120 
  48121 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_u64(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_u64(vgetq_lane_u64(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to a uint64x2_t local; yields a uint64x2_t. */
  48122 #define vcopyq_laneq_u64(__p0_328, __p1_328, __p2_328, __p3_328) __extension__ ({ \
  48123   uint64x2_t __ret_328; \
  48124   uint64x2_t __s0_328 = __p0_328; \
  48125   uint64x2_t __s2_328 = __p2_328; \
  48126   __ret_328 = vsetq_lane_u64(vgetq_lane_u64(__s2_328, __p3_328), __s0_328, __p1_328); \
  48127   __ret_328; \
  48128 })
  48129 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48130 #define vcopyq_laneq_u64(__p0_329, __p1_329, __p2_329, __p3_329) __extension__ ({ \
  48131   uint64x2_t __ret_329; \
  48132   uint64x2_t __s0_329 = __p0_329; \
  48133   uint64x2_t __s2_329 = __p2_329; \
  48134   uint64x2_t __rev0_329;  __rev0_329 = __builtin_shufflevector(__s0_329, __s0_329, 1, 0); \
  48135   uint64x2_t __rev2_329;  __rev2_329 = __builtin_shufflevector(__s2_329, __s2_329, 1, 0); \
  48136   __ret_329 = __noswap_vsetq_lane_u64(__noswap_vgetq_lane_u64(__rev2_329, __p3_329), __rev0_329, __p1_329); \
  48137   __ret_329 = __builtin_shufflevector(__ret_329, __ret_329, 1, 0); \
  48138   __ret_329; \
  48139 })
  48140 #endif
  48141 
  48142 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_u16(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_u16(vgetq_lane_u16(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to a uint16x8_t local; yields a uint16x8_t. */
  48143 #define vcopyq_laneq_u16(__p0_330, __p1_330, __p2_330, __p3_330) __extension__ ({ \
  48144   uint16x8_t __ret_330; \
  48145   uint16x8_t __s0_330 = __p0_330; \
  48146   uint16x8_t __s2_330 = __p2_330; \
  48147   __ret_330 = vsetq_lane_u16(vgetq_lane_u16(__s2_330, __p3_330), __s0_330, __p1_330); \
  48148   __ret_330; \
  48149 })
  48150 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48151 #define vcopyq_laneq_u16(__p0_331, __p1_331, __p2_331, __p3_331) __extension__ ({ \
  48152   uint16x8_t __ret_331; \
  48153   uint16x8_t __s0_331 = __p0_331; \
  48154   uint16x8_t __s2_331 = __p2_331; \
  48155   uint16x8_t __rev0_331;  __rev0_331 = __builtin_shufflevector(__s0_331, __s0_331, 7, 6, 5, 4, 3, 2, 1, 0); \
  48156   uint16x8_t __rev2_331;  __rev2_331 = __builtin_shufflevector(__s2_331, __s2_331, 7, 6, 5, 4, 3, 2, 1, 0); \
  48157   __ret_331 = __noswap_vsetq_lane_u16(__noswap_vgetq_lane_u16(__rev2_331, __p3_331), __rev0_331, __p1_331); \
  48158   __ret_331 = __builtin_shufflevector(__ret_331, __ret_331, 7, 6, 5, 4, 3, 2, 1, 0); \
  48159   __ret_331; \
  48160 })
  48161 #endif
  48162 
  48163 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_s8(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s8(vgetq_lane_s8(__p2, __p3), __p0, __p1), with __p0 and __p2 each
         * bound to an int8x16_t local; yields an int8x16_t. */
  48164 #define vcopyq_laneq_s8(__p0_332, __p1_332, __p2_332, __p3_332) __extension__ ({ \
  48165   int8x16_t __ret_332; \
  48166   int8x16_t __s0_332 = __p0_332; \
  48167   int8x16_t __s2_332 = __p2_332; \
  48168   __ret_332 = vsetq_lane_s8(vgetq_lane_s8(__s2_332, __p3_332), __s0_332, __p1_332); \
  48169   __ret_332; \
  48170 })
  48171 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48172 #define vcopyq_laneq_s8(__p0_333, __p1_333, __p2_333, __p3_333) __extension__ ({ \
  48173   int8x16_t __ret_333; \
  48174   int8x16_t __s0_333 = __p0_333; \
  48175   int8x16_t __s2_333 = __p2_333; \
  48176   int8x16_t __rev0_333;  __rev0_333 = __builtin_shufflevector(__s0_333, __s0_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48177   int8x16_t __rev2_333;  __rev2_333 = __builtin_shufflevector(__s2_333, __s2_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48178   __ret_333 = __noswap_vsetq_lane_s8(__noswap_vgetq_lane_s8(__rev2_333, __p3_333), __rev0_333, __p1_333); \
  48179   __ret_333 = __builtin_shufflevector(__ret_333, __ret_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48180   __ret_333; \
  48181 })
  48182 #endif
  48183 
  48184 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_f32(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_f32(vgetq_lane_f32(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to a float32x4_t local; yields a float32x4_t. */
  48185 #define vcopyq_laneq_f32(__p0_334, __p1_334, __p2_334, __p3_334) __extension__ ({ \
  48186   float32x4_t __ret_334; \
  48187   float32x4_t __s0_334 = __p0_334; \
  48188   float32x4_t __s2_334 = __p2_334; \
  48189   __ret_334 = vsetq_lane_f32(vgetq_lane_f32(__s2_334, __p3_334), __s0_334, __p1_334); \
  48190   __ret_334; \
  48191 })
  48192 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48193 #define vcopyq_laneq_f32(__p0_335, __p1_335, __p2_335, __p3_335) __extension__ ({ \
  48194   float32x4_t __ret_335; \
  48195   float32x4_t __s0_335 = __p0_335; \
  48196   float32x4_t __s2_335 = __p2_335; \
  48197   float32x4_t __rev0_335;  __rev0_335 = __builtin_shufflevector(__s0_335, __s0_335, 3, 2, 1, 0); \
  48198   float32x4_t __rev2_335;  __rev2_335 = __builtin_shufflevector(__s2_335, __s2_335, 3, 2, 1, 0); \
  48199   __ret_335 = __noswap_vsetq_lane_f32(__noswap_vgetq_lane_f32(__rev2_335, __p3_335), __rev0_335, __p1_335); \
  48200   __ret_335 = __builtin_shufflevector(__ret_335, __ret_335, 3, 2, 1, 0); \
  48201   __ret_335; \
  48202 })
  48203 #endif
  48204 
  48205 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_s32(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s32(vgetq_lane_s32(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to an int32x4_t local; yields an int32x4_t. */
  48206 #define vcopyq_laneq_s32(__p0_336, __p1_336, __p2_336, __p3_336) __extension__ ({ \
  48207   int32x4_t __ret_336; \
  48208   int32x4_t __s0_336 = __p0_336; \
  48209   int32x4_t __s2_336 = __p2_336; \
  48210   __ret_336 = vsetq_lane_s32(vgetq_lane_s32(__s2_336, __p3_336), __s0_336, __p1_336); \
  48211   __ret_336; \
  48212 })
  48213 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48214 #define vcopyq_laneq_s32(__p0_337, __p1_337, __p2_337, __p3_337) __extension__ ({ \
  48215   int32x4_t __ret_337; \
  48216   int32x4_t __s0_337 = __p0_337; \
  48217   int32x4_t __s2_337 = __p2_337; \
  48218   int32x4_t __rev0_337;  __rev0_337 = __builtin_shufflevector(__s0_337, __s0_337, 3, 2, 1, 0); \
  48219   int32x4_t __rev2_337;  __rev2_337 = __builtin_shufflevector(__s2_337, __s2_337, 3, 2, 1, 0); \
  48220   __ret_337 = __noswap_vsetq_lane_s32(__noswap_vgetq_lane_s32(__rev2_337, __p3_337), __rev0_337, __p1_337); \
  48221   __ret_337 = __builtin_shufflevector(__ret_337, __ret_337, 3, 2, 1, 0); \
  48222   __ret_337; \
  48223 })
  48224 #endif
  48225 
  48226 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_s64(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s64(vgetq_lane_s64(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to an int64x2_t local; yields an int64x2_t. */
  48227 #define vcopyq_laneq_s64(__p0_338, __p1_338, __p2_338, __p3_338) __extension__ ({ \
  48228   int64x2_t __ret_338; \
  48229   int64x2_t __s0_338 = __p0_338; \
  48230   int64x2_t __s2_338 = __p2_338; \
  48231   __ret_338 = vsetq_lane_s64(vgetq_lane_s64(__s2_338, __p3_338), __s0_338, __p1_338); \
  48232   __ret_338; \
  48233 })
  48234 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48235 #define vcopyq_laneq_s64(__p0_339, __p1_339, __p2_339, __p3_339) __extension__ ({ \
  48236   int64x2_t __ret_339; \
  48237   int64x2_t __s0_339 = __p0_339; \
  48238   int64x2_t __s2_339 = __p2_339; \
  48239   int64x2_t __rev0_339;  __rev0_339 = __builtin_shufflevector(__s0_339, __s0_339, 1, 0); \
  48240   int64x2_t __rev2_339;  __rev2_339 = __builtin_shufflevector(__s2_339, __s2_339, 1, 0); \
  48241   __ret_339 = __noswap_vsetq_lane_s64(__noswap_vgetq_lane_s64(__rev2_339, __p3_339), __rev0_339, __p1_339); \
  48242   __ret_339 = __builtin_shufflevector(__ret_339, __ret_339, 1, 0); \
  48243   __ret_339; \
  48244 })
  48245 #endif
  48246 
  48247 #ifdef __LITTLE_ENDIAN__
        /* vcopyq_laneq_s16(__p0, __p1, __p2, __p3): expands to
         * vsetq_lane_s16(vgetq_lane_s16(__p2, __p3), __p0, __p1), with __p0 and __p2
         * each bound to an int16x8_t local; yields an int16x8_t. */
  48248 #define vcopyq_laneq_s16(__p0_340, __p1_340, __p2_340, __p3_340) __extension__ ({ \
  48249   int16x8_t __ret_340; \
  48250   int16x8_t __s0_340 = __p0_340; \
  48251   int16x8_t __s2_340 = __p2_340; \
  48252   __ret_340 = vsetq_lane_s16(vgetq_lane_s16(__s2_340, __p3_340), __s0_340, __p1_340); \
  48253   __ret_340; \
  48254 })
  48255 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48256 #define vcopyq_laneq_s16(__p0_341, __p1_341, __p2_341, __p3_341) __extension__ ({ \
  48257   int16x8_t __ret_341; \
  48258   int16x8_t __s0_341 = __p0_341; \
  48259   int16x8_t __s2_341 = __p2_341; \
  48260   int16x8_t __rev0_341;  __rev0_341 = __builtin_shufflevector(__s0_341, __s0_341, 7, 6, 5, 4, 3, 2, 1, 0); \
  48261   int16x8_t __rev2_341;  __rev2_341 = __builtin_shufflevector(__s2_341, __s2_341, 7, 6, 5, 4, 3, 2, 1, 0); \
  48262   __ret_341 = __noswap_vsetq_lane_s16(__noswap_vgetq_lane_s16(__rev2_341, __p3_341), __rev0_341, __p1_341); \
  48263   __ret_341 = __builtin_shufflevector(__ret_341, __ret_341, 7, 6, 5, 4, 3, 2, 1, 0); \
  48264   __ret_341; \
  48265 })
  48266 #endif
  48267 
  48268 #ifdef __LITTLE_ENDIAN__
        /* vcopy_laneq_p8(__p0, __p1, __p2, __p3): expands to
         * vset_lane_p8(vgetq_lane_p8(__p2, __p3), __p0, __p1), with __p0 bound to a
         * poly8x8_t local and __p2 to a poly8x16_t local; yields a poly8x8_t. */
  48269 #define vcopy_laneq_p8(__p0_342, __p1_342, __p2_342, __p3_342) __extension__ ({ \
  48270   poly8x8_t __ret_342; \
  48271   poly8x8_t __s0_342 = __p0_342; \
  48272   poly8x16_t __s2_342 = __p2_342; \
  48273   __ret_342 = vset_lane_p8(vgetq_lane_p8(__s2_342, __p3_342), __s0_342, __p1_342); \
  48274   __ret_342; \
  48275 })
  48276 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48277 #define vcopy_laneq_p8(__p0_343, __p1_343, __p2_343, __p3_343) __extension__ ({ \
  48278   poly8x8_t __ret_343; \
  48279   poly8x8_t __s0_343 = __p0_343; \
  48280   poly8x16_t __s2_343 = __p2_343; \
  48281   poly8x8_t __rev0_343;  __rev0_343 = __builtin_shufflevector(__s0_343, __s0_343, 7, 6, 5, 4, 3, 2, 1, 0); \
  48282   poly8x16_t __rev2_343;  __rev2_343 = __builtin_shufflevector(__s2_343, __s2_343, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48283   __ret_343 = __noswap_vset_lane_p8(__noswap_vgetq_lane_p8(__rev2_343, __p3_343), __rev0_343, __p1_343); \
  48284   __ret_343 = __builtin_shufflevector(__ret_343, __ret_343, 7, 6, 5, 4, 3, 2, 1, 0); \
  48285   __ret_343; \
  48286 })
  48287 #endif
  48288 
  48289 #ifdef __LITTLE_ENDIAN__
        /* vcopy_laneq_p16(__p0, __p1, __p2, __p3): expands to
         * vset_lane_p16(vgetq_lane_p16(__p2, __p3), __p0, __p1), with __p0 bound to a
         * poly16x4_t local and __p2 to a poly16x8_t local; yields a poly16x4_t. */
  48290 #define vcopy_laneq_p16(__p0_344, __p1_344, __p2_344, __p3_344) __extension__ ({ \
  48291   poly16x4_t __ret_344; \
  48292   poly16x4_t __s0_344 = __p0_344; \
  48293   poly16x8_t __s2_344 = __p2_344; \
  48294   __ret_344 = vset_lane_p16(vgetq_lane_p16(__s2_344, __p3_344), __s0_344, __p1_344); \
  48295   __ret_344; \
  48296 })
  48297 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48298 #define vcopy_laneq_p16(__p0_345, __p1_345, __p2_345, __p3_345) __extension__ ({ \
  48299   poly16x4_t __ret_345; \
  48300   poly16x4_t __s0_345 = __p0_345; \
  48301   poly16x8_t __s2_345 = __p2_345; \
  48302   poly16x4_t __rev0_345;  __rev0_345 = __builtin_shufflevector(__s0_345, __s0_345, 3, 2, 1, 0); \
  48303   poly16x8_t __rev2_345;  __rev2_345 = __builtin_shufflevector(__s2_345, __s2_345, 7, 6, 5, 4, 3, 2, 1, 0); \
  48304   __ret_345 = __noswap_vset_lane_p16(__noswap_vgetq_lane_p16(__rev2_345, __p3_345), __rev0_345, __p1_345); \
  48305   __ret_345 = __builtin_shufflevector(__ret_345, __ret_345, 3, 2, 1, 0); \
  48306   __ret_345; \
  48307 })
  48308 #endif
  48309 
  48310 #ifdef __LITTLE_ENDIAN__
        /* vcopy_laneq_u8(__p0, __p1, __p2, __p3): expands to
         * vset_lane_u8(vgetq_lane_u8(__p2, __p3), __p0, __p1), with __p0 bound to a
         * uint8x8_t local and __p2 to a uint8x16_t local; yields a uint8x8_t. */
  48311 #define vcopy_laneq_u8(__p0_346, __p1_346, __p2_346, __p3_346) __extension__ ({ \
  48312   uint8x8_t __ret_346; \
  48313   uint8x8_t __s0_346 = __p0_346; \
  48314   uint8x16_t __s2_346 = __p2_346; \
  48315   __ret_346 = vset_lane_u8(vgetq_lane_u8(__s2_346, __p3_346), __s0_346, __p1_346); \
  48316   __ret_346; \
  48317 })
  48318 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48319 #define vcopy_laneq_u8(__p0_347, __p1_347, __p2_347, __p3_347) __extension__ ({ \
  48320   uint8x8_t __ret_347; \
  48321   uint8x8_t __s0_347 = __p0_347; \
  48322   uint8x16_t __s2_347 = __p2_347; \
  48323   uint8x8_t __rev0_347;  __rev0_347 = __builtin_shufflevector(__s0_347, __s0_347, 7, 6, 5, 4, 3, 2, 1, 0); \
  48324   uint8x16_t __rev2_347;  __rev2_347 = __builtin_shufflevector(__s2_347, __s2_347, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48325   __ret_347 = __noswap_vset_lane_u8(__noswap_vgetq_lane_u8(__rev2_347, __p3_347), __rev0_347, __p1_347); \
  48326   __ret_347 = __builtin_shufflevector(__ret_347, __ret_347, 7, 6, 5, 4, 3, 2, 1, 0); \
  48327   __ret_347; \
  48328 })
  48329 #endif
  48330 
  48331 #ifdef __LITTLE_ENDIAN__
        /* vcopy_laneq_u32(__p0, __p1, __p2, __p3): expands to
         * vset_lane_u32(vgetq_lane_u32(__p2, __p3), __p0, __p1), with __p0 bound to a
         * uint32x2_t local and __p2 to a uint32x4_t local; yields a uint32x2_t. */
  48332 #define vcopy_laneq_u32(__p0_348, __p1_348, __p2_348, __p3_348) __extension__ ({ \
  48333   uint32x2_t __ret_348; \
  48334   uint32x2_t __s0_348 = __p0_348; \
  48335   uint32x4_t __s2_348 = __p2_348; \
  48336   __ret_348 = vset_lane_u32(vgetq_lane_u32(__s2_348, __p3_348), __s0_348, __p1_348); \
  48337   __ret_348; \
  48338 })
  48339 #else
        /* Used when __LITTLE_ENDIAN__ is not defined: __p0 and __p2 are both
         * element-reversed with __builtin_shufflevector, the __noswap_ getter and
         * setter run on the reversed copies, and the result is reversed back. */
  48340 #define vcopy_laneq_u32(__p0_349, __p1_349, __p2_349, __p3_349) __extension__ ({ \
  48341   uint32x2_t __ret_349; \
  48342   uint32x2_t __s0_349 = __p0_349; \
  48343   uint32x4_t __s2_349 = __p2_349; \
  48344   uint32x2_t __rev0_349;  __rev0_349 = __builtin_shufflevector(__s0_349, __s0_349, 1, 0); \
  48345   uint32x4_t __rev2_349;  __rev2_349 = __builtin_shufflevector(__s2_349, __s2_349, 3, 2, 1, 0); \
  48346   __ret_349 = __noswap_vset_lane_u32(__noswap_vgetq_lane_u32(__rev2_349, __p3_349), __rev0_349, __p1_349); \
  48347   __ret_349 = __builtin_shufflevector(__ret_349, __ret_349, 1, 0); \
  48348   __ret_349; \
  48349 })
  48350 #endif
  48351 
  48352 #ifdef __LITTLE_ENDIAN__
  48353 #define vcopy_laneq_u64(__p0_350, __p1_350, __p2_350, __p3_350) __extension__ ({ \
  48354   uint64x1_t __ret_350; \
  48355   uint64x1_t __s0_350 = __p0_350; \
  48356   uint64x2_t __s2_350 = __p2_350; \
  48357   __ret_350 = vset_lane_u64(vgetq_lane_u64(__s2_350, __p3_350), __s0_350, __p1_350); \
  48358   __ret_350; \
  48359 })
  48360 #else
  48361 #define vcopy_laneq_u64(__p0_351, __p1_351, __p2_351, __p3_351) __extension__ ({ \
  48362   uint64x1_t __ret_351; \
  48363   uint64x1_t __s0_351 = __p0_351; \
  48364   uint64x2_t __s2_351 = __p2_351; \
  48365   uint64x2_t __rev2_351;  __rev2_351 = __builtin_shufflevector(__s2_351, __s2_351, 1, 0); \
  48366   __ret_351 = vset_lane_u64(__noswap_vgetq_lane_u64(__rev2_351, __p3_351), __s0_351, __p1_351); \
  48367   __ret_351; \
  48368 })
  48369 #endif
  48370 
  48371 #ifdef __LITTLE_ENDIAN__
  48372 #define vcopy_laneq_u16(__p0_352, __p1_352, __p2_352, __p3_352) __extension__ ({ \
  48373   uint16x4_t __ret_352; \
  48374   uint16x4_t __s0_352 = __p0_352; \
  48375   uint16x8_t __s2_352 = __p2_352; \
  48376   __ret_352 = vset_lane_u16(vgetq_lane_u16(__s2_352, __p3_352), __s0_352, __p1_352); \
  48377   __ret_352; \
  48378 })
  48379 #else
  48380 #define vcopy_laneq_u16(__p0_353, __p1_353, __p2_353, __p3_353) __extension__ ({ \
  48381   uint16x4_t __ret_353; \
  48382   uint16x4_t __s0_353 = __p0_353; \
  48383   uint16x8_t __s2_353 = __p2_353; \
  48384   uint16x4_t __rev0_353;  __rev0_353 = __builtin_shufflevector(__s0_353, __s0_353, 3, 2, 1, 0); \
  48385   uint16x8_t __rev2_353;  __rev2_353 = __builtin_shufflevector(__s2_353, __s2_353, 7, 6, 5, 4, 3, 2, 1, 0); \
  48386   __ret_353 = __noswap_vset_lane_u16(__noswap_vgetq_lane_u16(__rev2_353, __p3_353), __rev0_353, __p1_353); \
  48387   __ret_353 = __builtin_shufflevector(__ret_353, __ret_353, 3, 2, 1, 0); \
  48388   __ret_353; \
  48389 })
  48390 #endif
  48391 
  48392 #ifdef __LITTLE_ENDIAN__
  48393 #define vcopy_laneq_s8(__p0_354, __p1_354, __p2_354, __p3_354) __extension__ ({ \
  48394   int8x8_t __ret_354; \
  48395   int8x8_t __s0_354 = __p0_354; \
  48396   int8x16_t __s2_354 = __p2_354; \
  48397   __ret_354 = vset_lane_s8(vgetq_lane_s8(__s2_354, __p3_354), __s0_354, __p1_354); \
  48398   __ret_354; \
  48399 })
  48400 #else
  48401 #define vcopy_laneq_s8(__p0_355, __p1_355, __p2_355, __p3_355) __extension__ ({ \
  48402   int8x8_t __ret_355; \
  48403   int8x8_t __s0_355 = __p0_355; \
  48404   int8x16_t __s2_355 = __p2_355; \
  48405   int8x8_t __rev0_355;  __rev0_355 = __builtin_shufflevector(__s0_355, __s0_355, 7, 6, 5, 4, 3, 2, 1, 0); \
  48406   int8x16_t __rev2_355;  __rev2_355 = __builtin_shufflevector(__s2_355, __s2_355, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  48407   __ret_355 = __noswap_vset_lane_s8(__noswap_vgetq_lane_s8(__rev2_355, __p3_355), __rev0_355, __p1_355); \
  48408   __ret_355 = __builtin_shufflevector(__ret_355, __ret_355, 7, 6, 5, 4, 3, 2, 1, 0); \
  48409   __ret_355; \
  48410 })
  48411 #endif
  48412 
  48413 #ifdef __LITTLE_ENDIAN__
  48414 #define vcopy_laneq_f32(__p0_356, __p1_356, __p2_356, __p3_356) __extension__ ({ \
  48415   float32x2_t __ret_356; \
  48416   float32x2_t __s0_356 = __p0_356; \
  48417   float32x4_t __s2_356 = __p2_356; \
  48418   __ret_356 = vset_lane_f32(vgetq_lane_f32(__s2_356, __p3_356), __s0_356, __p1_356); \
  48419   __ret_356; \
  48420 })
  48421 #else
  48422 #define vcopy_laneq_f32(__p0_357, __p1_357, __p2_357, __p3_357) __extension__ ({ \
  48423   float32x2_t __ret_357; \
  48424   float32x2_t __s0_357 = __p0_357; \
  48425   float32x4_t __s2_357 = __p2_357; \
  48426   float32x2_t __rev0_357;  __rev0_357 = __builtin_shufflevector(__s0_357, __s0_357, 1, 0); \
  48427   float32x4_t __rev2_357;  __rev2_357 = __builtin_shufflevector(__s2_357, __s2_357, 3, 2, 1, 0); \
  48428   __ret_357 = __noswap_vset_lane_f32(__noswap_vgetq_lane_f32(__rev2_357, __p3_357), __rev0_357, __p1_357); \
  48429   __ret_357 = __builtin_shufflevector(__ret_357, __ret_357, 1, 0); \
  48430   __ret_357; \
  48431 })
  48432 #endif
  48433 
  48434 #ifdef __LITTLE_ENDIAN__
  48435 #define vcopy_laneq_s32(__p0_358, __p1_358, __p2_358, __p3_358) __extension__ ({ \
  48436   int32x2_t __ret_358; \
  48437   int32x2_t __s0_358 = __p0_358; \
  48438   int32x4_t __s2_358 = __p2_358; \
  48439   __ret_358 = vset_lane_s32(vgetq_lane_s32(__s2_358, __p3_358), __s0_358, __p1_358); \
  48440   __ret_358; \
  48441 })
  48442 #else
  48443 #define vcopy_laneq_s32(__p0_359, __p1_359, __p2_359, __p3_359) __extension__ ({ \
  48444   int32x2_t __ret_359; \
  48445   int32x2_t __s0_359 = __p0_359; \
  48446   int32x4_t __s2_359 = __p2_359; \
  48447   int32x2_t __rev0_359;  __rev0_359 = __builtin_shufflevector(__s0_359, __s0_359, 1, 0); \
  48448   int32x4_t __rev2_359;  __rev2_359 = __builtin_shufflevector(__s2_359, __s2_359, 3, 2, 1, 0); \
  48449   __ret_359 = __noswap_vset_lane_s32(__noswap_vgetq_lane_s32(__rev2_359, __p3_359), __rev0_359, __p1_359); \
  48450   __ret_359 = __builtin_shufflevector(__ret_359, __ret_359, 1, 0); \
  48451   __ret_359; \
  48452 })
  48453 #endif
  48454 
  48455 #ifdef __LITTLE_ENDIAN__
  48456 #define vcopy_laneq_s64(__p0_360, __p1_360, __p2_360, __p3_360) __extension__ ({ \
  48457   int64x1_t __ret_360; \
  48458   int64x1_t __s0_360 = __p0_360; \
  48459   int64x2_t __s2_360 = __p2_360; \
  48460   __ret_360 = vset_lane_s64(vgetq_lane_s64(__s2_360, __p3_360), __s0_360, __p1_360); \
  48461   __ret_360; \
  48462 })
  48463 #else
  48464 #define vcopy_laneq_s64(__p0_361, __p1_361, __p2_361, __p3_361) __extension__ ({ \
  48465   int64x1_t __ret_361; \
  48466   int64x1_t __s0_361 = __p0_361; \
  48467   int64x2_t __s2_361 = __p2_361; \
  48468   int64x2_t __rev2_361;  __rev2_361 = __builtin_shufflevector(__s2_361, __s2_361, 1, 0); \
  48469   __ret_361 = vset_lane_s64(__noswap_vgetq_lane_s64(__rev2_361, __p3_361), __s0_361, __p1_361); \
  48470   __ret_361; \
  48471 })
  48472 #endif
  48473 
  48474 #ifdef __LITTLE_ENDIAN__
  48475 #define vcopy_laneq_s16(__p0_362, __p1_362, __p2_362, __p3_362) __extension__ ({ \
  48476   int16x4_t __ret_362; \
  48477   int16x4_t __s0_362 = __p0_362; \
  48478   int16x8_t __s2_362 = __p2_362; \
  48479   __ret_362 = vset_lane_s16(vgetq_lane_s16(__s2_362, __p3_362), __s0_362, __p1_362); \
  48480   __ret_362; \
  48481 })
  48482 #else
  48483 #define vcopy_laneq_s16(__p0_363, __p1_363, __p2_363, __p3_363) __extension__ ({ \
  48484   int16x4_t __ret_363; \
  48485   int16x4_t __s0_363 = __p0_363; \
  48486   int16x8_t __s2_363 = __p2_363; \
  48487   int16x4_t __rev0_363;  __rev0_363 = __builtin_shufflevector(__s0_363, __s0_363, 3, 2, 1, 0); \
  48488   int16x8_t __rev2_363;  __rev2_363 = __builtin_shufflevector(__s2_363, __s2_363, 7, 6, 5, 4, 3, 2, 1, 0); \
  48489   __ret_363 = __noswap_vset_lane_s16(__noswap_vgetq_lane_s16(__rev2_363, __p3_363), __rev0_363, __p1_363); \
  48490   __ret_363 = __builtin_shufflevector(__ret_363, __ret_363, 3, 2, 1, 0); \
  48491   __ret_363; \
  48492 })
  48493 #endif
  48494 
  48495 #define vcreate_p64(__p0) __extension__ ({ \
  48496   poly64x1_t __ret; \
  48497   uint64_t __promote = __p0; \
  48498   __ret = (poly64x1_t)(__promote); \
  48499   __ret; \
  48500 })
  48501 #define vcreate_f64(__p0) __extension__ ({ \
  48502   float64x1_t __ret; \
  48503   uint64_t __promote = __p0; \
  48504   __ret = (float64x1_t)(__promote); \
  48505   __ret; \
  48506 })
  48507 __ai __attribute__((target("neon"))) float32_t vcvts_f32_s32(int32_t __p0) {
  48508   float32_t __ret;
  48509   __ret = (float32_t) __builtin_neon_vcvts_f32_s32(__p0);
  48510   return __ret;
  48511 }
  48512 __ai __attribute__((target("neon"))) float32_t vcvts_f32_u32(uint32_t __p0) {
  48513   float32_t __ret;
  48514   __ret = (float32_t) __builtin_neon_vcvts_f32_u32(__p0);
  48515   return __ret;
  48516 }
  48517 #ifdef __LITTLE_ENDIAN__
  48518 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_f64(float64x2_t __p0) {
  48519   float32x2_t __ret;
  48520   __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__p0, 9);
  48521   return __ret;
  48522 }
  48523 #else
  48524 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_f64(float64x2_t __p0) {
  48525   float32x2_t __ret;
  48526   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48527   __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__rev0, 9);
  48528   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48529   return __ret;
  48530 }
  48531 __ai __attribute__((target("neon"))) float32x2_t __noswap_vcvt_f32_f64(float64x2_t __p0) {
  48532   float32x2_t __ret;
  48533   __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__p0, 9);
  48534   return __ret;
  48535 }
  48536 #endif
  48537 
  48538 __ai __attribute__((target("neon"))) float64_t vcvtd_f64_s64(int64_t __p0) {
  48539   float64_t __ret;
  48540   __ret = (float64_t) __builtin_neon_vcvtd_f64_s64(__p0);
  48541   return __ret;
  48542 }
  48543 __ai __attribute__((target("neon"))) float64_t vcvtd_f64_u64(uint64_t __p0) {
  48544   float64_t __ret;
  48545   __ret = (float64_t) __builtin_neon_vcvtd_f64_u64(__p0);
  48546   return __ret;
  48547 }
  48548 #ifdef __LITTLE_ENDIAN__
  48549 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_u64(uint64x2_t __p0) {
  48550   float64x2_t __ret;
  48551   __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__p0, 51);
  48552   return __ret;
  48553 }
  48554 #else
  48555 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_u64(uint64x2_t __p0) {
  48556   float64x2_t __ret;
  48557   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48558   __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__rev0, 51);
  48559   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48560   return __ret;
  48561 }
  48562 #endif
  48563 
  48564 #ifdef __LITTLE_ENDIAN__
  48565 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_s64(int64x2_t __p0) {
  48566   float64x2_t __ret;
  48567   __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__p0, 35);
  48568   return __ret;
  48569 }
  48570 #else
  48571 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_s64(int64x2_t __p0) {
  48572   float64x2_t __ret;
  48573   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48574   __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__rev0, 35);
  48575   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48576   return __ret;
  48577 }
  48578 #endif
  48579 
  48580 __ai __attribute__((target("neon"))) float64x1_t vcvt_f64_u64(uint64x1_t __p0) {
  48581   float64x1_t __ret;
  48582   __ret = (float64x1_t) __builtin_neon_vcvt_f64_v((int8x8_t)__p0, 19);
  48583   return __ret;
  48584 }
  48585 __ai __attribute__((target("neon"))) float64x1_t vcvt_f64_s64(int64x1_t __p0) {
  48586   float64x1_t __ret;
  48587   __ret = (float64x1_t) __builtin_neon_vcvt_f64_v((int8x8_t)__p0, 3);
  48588   return __ret;
  48589 }
  48590 #ifdef __LITTLE_ENDIAN__
  48591 __ai __attribute__((target("neon"))) float64x2_t vcvt_f64_f32(float32x2_t __p0) {
  48592   float64x2_t __ret;
  48593   __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__p0, 42);
  48594   return __ret;
  48595 }
  48596 #else
  48597 __ai __attribute__((target("neon"))) float64x2_t vcvt_f64_f32(float32x2_t __p0) {
  48598   float64x2_t __ret;
  48599   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48600   __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__rev0, 42);
  48601   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48602   return __ret;
  48603 }
  48604 __ai __attribute__((target("neon"))) float64x2_t __noswap_vcvt_f64_f32(float32x2_t __p0) {
  48605   float64x2_t __ret;
  48606   __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__p0, 42);
  48607   return __ret;
  48608 }
  48609 #endif
  48610 
  48611 #ifdef __LITTLE_ENDIAN__
  48612 __ai __attribute__((target("neon"))) float16x8_t vcvt_high_f16_f32(float16x4_t __p0, float32x4_t __p1) {
  48613   float16x8_t __ret;
  48614   __ret = vcombine_f16(__p0, vcvt_f16_f32(__p1));
  48615   return __ret;
  48616 }
  48617 #else
  48618 __ai __attribute__((target("neon"))) float16x8_t vcvt_high_f16_f32(float16x4_t __p0, float32x4_t __p1) {
  48619   float16x8_t __ret;
  48620   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  48621   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  48622   __ret = __noswap_vcombine_f16(__rev0, __noswap_vcvt_f16_f32(__rev1));
  48623   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  48624   return __ret;
  48625 }
  48626 #endif
  48627 
  48628 #ifdef __LITTLE_ENDIAN__
  48629 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f16(float16x8_t __p0) {
  48630   float32x4_t __ret;
  48631   __ret = vcvt_f32_f16(vget_high_f16(__p0));
  48632   return __ret;
  48633 }
  48634 #else
  48635 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f16(float16x8_t __p0) {
  48636   float32x4_t __ret;
  48637   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  48638   __ret = __noswap_vcvt_f32_f16(__noswap_vget_high_f16(__rev0));
  48639   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  48640   return __ret;
  48641 }
  48642 #endif
  48643 
  48644 #ifdef __LITTLE_ENDIAN__
  48645 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f64(float32x2_t __p0, float64x2_t __p1) {
  48646   float32x4_t __ret;
  48647   __ret = vcombine_f32(__p0, vcvt_f32_f64(__p1));
  48648   return __ret;
  48649 }
  48650 #else
  48651 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f64(float32x2_t __p0, float64x2_t __p1) {
  48652   float32x4_t __ret;
  48653   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48654   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  48655   __ret = __noswap_vcombine_f32(__rev0, __noswap_vcvt_f32_f64(__rev1));
  48656   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  48657   return __ret;
  48658 }
  48659 #endif
  48660 
  48661 #ifdef __LITTLE_ENDIAN__
  48662 __ai __attribute__((target("neon"))) float64x2_t vcvt_high_f64_f32(float32x4_t __p0) {
  48663   float64x2_t __ret;
  48664   __ret = vcvt_f64_f32(vget_high_f32(__p0));
  48665   return __ret;
  48666 }
  48667 #else
  48668 __ai __attribute__((target("neon"))) float64x2_t vcvt_high_f64_f32(float32x4_t __p0) {
  48669   float64x2_t __ret;
  48670   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  48671   __ret = __noswap_vcvt_f64_f32(__noswap_vget_high_f32(__rev0));
  48672   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48673   return __ret;
  48674 }
  48675 #endif
  48676 
  48677 #define vcvts_n_f32_u32(__p0, __p1) __extension__ ({ \
  48678   float32_t __ret; \
  48679   uint32_t __s0 = __p0; \
  48680   __ret = (float32_t) __builtin_neon_vcvts_n_f32_u32(__s0, __p1); \
  48681   __ret; \
  48682 })
  48683 #define vcvts_n_f32_s32(__p0, __p1) __extension__ ({ \
  48684   float32_t __ret; \
  48685   int32_t __s0 = __p0; \
  48686   __ret = (float32_t) __builtin_neon_vcvts_n_f32_s32(__s0, __p1); \
  48687   __ret; \
  48688 })
  48689 #ifdef __LITTLE_ENDIAN__
  48690 #define vcvtq_n_f64_u64(__p0, __p1) __extension__ ({ \
  48691   float64x2_t __ret; \
  48692   uint64x2_t __s0 = __p0; \
  48693   __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__s0, __p1, 51); \
  48694   __ret; \
  48695 })
  48696 #else
  48697 #define vcvtq_n_f64_u64(__p0, __p1) __extension__ ({ \
  48698   float64x2_t __ret; \
  48699   uint64x2_t __s0 = __p0; \
  48700   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  48701   __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__rev0, __p1, 51); \
  48702   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  48703   __ret; \
  48704 })
  48705 #endif
  48706 
  48707 #ifdef __LITTLE_ENDIAN__
  48708 #define vcvtq_n_f64_s64(__p0, __p1) __extension__ ({ \
  48709   float64x2_t __ret; \
  48710   int64x2_t __s0 = __p0; \
  48711   __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__s0, __p1, 35); \
  48712   __ret; \
  48713 })
  48714 #else
  48715 #define vcvtq_n_f64_s64(__p0, __p1) __extension__ ({ \
  48716   float64x2_t __ret; \
  48717   int64x2_t __s0 = __p0; \
  48718   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  48719   __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__rev0, __p1, 35); \
  48720   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  48721   __ret; \
  48722 })
  48723 #endif
  48724 
  48725 #define vcvt_n_f64_u64(__p0, __p1) __extension__ ({ \
  48726   float64x1_t __ret; \
  48727   uint64x1_t __s0 = __p0; \
  48728   __ret = (float64x1_t) __builtin_neon_vcvt_n_f64_v((int8x8_t)__s0, __p1, 19); \
  48729   __ret; \
  48730 })
  48731 #define vcvt_n_f64_s64(__p0, __p1) __extension__ ({ \
  48732   float64x1_t __ret; \
  48733   int64x1_t __s0 = __p0; \
  48734   __ret = (float64x1_t) __builtin_neon_vcvt_n_f64_v((int8x8_t)__s0, __p1, 3); \
  48735   __ret; \
  48736 })
  48737 #define vcvtd_n_f64_u64(__p0, __p1) __extension__ ({ \
  48738   float64_t __ret; \
  48739   uint64_t __s0 = __p0; \
  48740   __ret = (float64_t) __builtin_neon_vcvtd_n_f64_u64(__s0, __p1); \
  48741   __ret; \
  48742 })
  48743 #define vcvtd_n_f64_s64(__p0, __p1) __extension__ ({ \
  48744   float64_t __ret; \
  48745   int64_t __s0 = __p0; \
  48746   __ret = (float64_t) __builtin_neon_vcvtd_n_f64_s64(__s0, __p1); \
  48747   __ret; \
  48748 })
  48749 #define vcvts_n_s32_f32(__p0, __p1) __extension__ ({ \
  48750   int32_t __ret; \
  48751   float32_t __s0 = __p0; \
  48752   __ret = (int32_t) __builtin_neon_vcvts_n_s32_f32(__s0, __p1); \
  48753   __ret; \
  48754 })
  48755 #ifdef __LITTLE_ENDIAN__
  48756 #define vcvtq_n_s64_f64(__p0, __p1) __extension__ ({ \
  48757   int64x2_t __ret; \
  48758   float64x2_t __s0 = __p0; \
  48759   __ret = (int64x2_t) __builtin_neon_vcvtq_n_s64_v((int8x16_t)__s0, __p1, 35); \
  48760   __ret; \
  48761 })
  48762 #else
  48763 #define vcvtq_n_s64_f64(__p0, __p1) __extension__ ({ \
  48764   int64x2_t __ret; \
  48765   float64x2_t __s0 = __p0; \
  48766   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  48767   __ret = (int64x2_t) __builtin_neon_vcvtq_n_s64_v((int8x16_t)__rev0, __p1, 35); \
  48768   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  48769   __ret; \
  48770 })
  48771 #endif
  48772 
  48773 #define vcvt_n_s64_f64(__p0, __p1) __extension__ ({ \
  48774   int64x1_t __ret; \
  48775   float64x1_t __s0 = __p0; \
  48776   __ret = (int64x1_t) __builtin_neon_vcvt_n_s64_v((int8x8_t)__s0, __p1, 3); \
  48777   __ret; \
  48778 })
  48779 #define vcvtd_n_s64_f64(__p0, __p1) __extension__ ({ \
  48780   int64_t __ret; \
  48781   float64_t __s0 = __p0; \
  48782   __ret = (int64_t) __builtin_neon_vcvtd_n_s64_f64(__s0, __p1); \
  48783   __ret; \
  48784 })
  48785 #define vcvts_n_u32_f32(__p0, __p1) __extension__ ({ \
  48786   uint32_t __ret; \
  48787   float32_t __s0 = __p0; \
  48788   __ret = (uint32_t) __builtin_neon_vcvts_n_u32_f32(__s0, __p1); \
  48789   __ret; \
  48790 })
  48791 #ifdef __LITTLE_ENDIAN__
  48792 #define vcvtq_n_u64_f64(__p0, __p1) __extension__ ({ \
  48793   uint64x2_t __ret; \
  48794   float64x2_t __s0 = __p0; \
  48795   __ret = (uint64x2_t) __builtin_neon_vcvtq_n_u64_v((int8x16_t)__s0, __p1, 51); \
  48796   __ret; \
  48797 })
  48798 #else
  48799 #define vcvtq_n_u64_f64(__p0, __p1) __extension__ ({ \
  48800   uint64x2_t __ret; \
  48801   float64x2_t __s0 = __p0; \
  48802   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  48803   __ret = (uint64x2_t) __builtin_neon_vcvtq_n_u64_v((int8x16_t)__rev0, __p1, 51); \
  48804   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  48805   __ret; \
  48806 })
  48807 #endif
  48808 
  48809 #define vcvt_n_u64_f64(__p0, __p1) __extension__ ({ \
  48810   uint64x1_t __ret; \
  48811   float64x1_t __s0 = __p0; \
  48812   __ret = (uint64x1_t) __builtin_neon_vcvt_n_u64_v((int8x8_t)__s0, __p1, 19); \
  48813   __ret; \
  48814 })
  48815 #define vcvtd_n_u64_f64(__p0, __p1) __extension__ ({ \
  48816   uint64_t __ret; \
  48817   float64_t __s0 = __p0; \
  48818   __ret = (uint64_t) __builtin_neon_vcvtd_n_u64_f64(__s0, __p1); \
  48819   __ret; \
  48820 })
  48821 __ai __attribute__((target("neon"))) int32_t vcvts_s32_f32(float32_t __p0) {
  48822   int32_t __ret;
  48823   __ret = (int32_t) __builtin_neon_vcvts_s32_f32(__p0);
  48824   return __ret;
  48825 }
  48826 __ai __attribute__((target("neon"))) int64_t vcvtd_s64_f64(float64_t __p0) {
  48827   int64_t __ret;
  48828   __ret = (int64_t) __builtin_neon_vcvtd_s64_f64(__p0);
  48829   return __ret;
  48830 }
  48831 #ifdef __LITTLE_ENDIAN__
  48832 __ai __attribute__((target("neon"))) int64x2_t vcvtq_s64_f64(float64x2_t __p0) {
  48833   int64x2_t __ret;
  48834   __ret = (int64x2_t) __builtin_neon_vcvtq_s64_v((int8x16_t)__p0, 35);
  48835   return __ret;
  48836 }
  48837 #else
  48838 __ai __attribute__((target("neon"))) int64x2_t vcvtq_s64_f64(float64x2_t __p0) {
  48839   int64x2_t __ret;
  48840   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48841   __ret = (int64x2_t) __builtin_neon_vcvtq_s64_v((int8x16_t)__rev0, 35);
  48842   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48843   return __ret;
  48844 }
  48845 #endif
  48846 
  48847 __ai __attribute__((target("neon"))) int64x1_t vcvt_s64_f64(float64x1_t __p0) {
  48848   int64x1_t __ret;
  48849   __ret = (int64x1_t) __builtin_neon_vcvt_s64_v((int8x8_t)__p0, 3);
  48850   return __ret;
  48851 }
  48852 __ai __attribute__((target("neon"))) uint32_t vcvts_u32_f32(float32_t __p0) {
  48853   uint32_t __ret;
  48854   __ret = (uint32_t) __builtin_neon_vcvts_u32_f32(__p0);
  48855   return __ret;
  48856 }
  48857 __ai __attribute__((target("neon"))) uint64_t vcvtd_u64_f64(float64_t __p0) {
  48858   uint64_t __ret;
  48859   __ret = (uint64_t) __builtin_neon_vcvtd_u64_f64(__p0);
  48860   return __ret;
  48861 }
  48862 #ifdef __LITTLE_ENDIAN__
  48863 __ai __attribute__((target("neon"))) uint64x2_t vcvtq_u64_f64(float64x2_t __p0) {
  48864   uint64x2_t __ret;
  48865   __ret = (uint64x2_t) __builtin_neon_vcvtq_u64_v((int8x16_t)__p0, 51);
  48866   return __ret;
  48867 }
  48868 #else
  48869 __ai __attribute__((target("neon"))) uint64x2_t vcvtq_u64_f64(float64x2_t __p0) {
  48870   uint64x2_t __ret;
  48871   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48872   __ret = (uint64x2_t) __builtin_neon_vcvtq_u64_v((int8x16_t)__rev0, 51);
  48873   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48874   return __ret;
  48875 }
  48876 #endif
  48877 
  48878 __ai __attribute__((target("neon"))) uint64x1_t vcvt_u64_f64(float64x1_t __p0) {
  48879   uint64x1_t __ret;
  48880   __ret = (uint64x1_t) __builtin_neon_vcvt_u64_v((int8x8_t)__p0, 19);
  48881   return __ret;
  48882 }
  48883 __ai __attribute__((target("neon"))) int32_t vcvtas_s32_f32(float32_t __p0) {
  48884   int32_t __ret;
  48885   __ret = (int32_t) __builtin_neon_vcvtas_s32_f32(__p0);
  48886   return __ret;
  48887 }
  48888 #ifdef __LITTLE_ENDIAN__
  48889 __ai __attribute__((target("neon"))) int64x2_t vcvtaq_s64_f64(float64x2_t __p0) {
  48890   int64x2_t __ret;
  48891   __ret = (int64x2_t) __builtin_neon_vcvtaq_s64_v((int8x16_t)__p0, 35);
  48892   return __ret;
  48893 }
  48894 #else
  48895 __ai __attribute__((target("neon"))) int64x2_t vcvtaq_s64_f64(float64x2_t __p0) {
  48896   int64x2_t __ret;
  48897   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48898   __ret = (int64x2_t) __builtin_neon_vcvtaq_s64_v((int8x16_t)__rev0, 35);
  48899   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48900   return __ret;
  48901 }
  48902 #endif
  48903 
  48904 __ai __attribute__((target("neon"))) int64x1_t vcvta_s64_f64(float64x1_t __p0) {
  48905   int64x1_t __ret;
  48906   __ret = (int64x1_t) __builtin_neon_vcvta_s64_v((int8x8_t)__p0, 3);
  48907   return __ret;
  48908 }
  48909 __ai __attribute__((target("neon"))) int64_t vcvtad_s64_f64(float64_t __p0) {
  48910   int64_t __ret;
  48911   __ret = (int64_t) __builtin_neon_vcvtad_s64_f64(__p0);
  48912   return __ret;
  48913 }
  48914 __ai __attribute__((target("neon"))) uint32_t vcvtas_u32_f32(float32_t __p0) {
  48915   uint32_t __ret;
  48916   __ret = (uint32_t) __builtin_neon_vcvtas_u32_f32(__p0);
  48917   return __ret;
  48918 }
  48919 #ifdef __LITTLE_ENDIAN__
  48920 __ai __attribute__((target("neon"))) uint64x2_t vcvtaq_u64_f64(float64x2_t __p0) {
  48921   uint64x2_t __ret;
  48922   __ret = (uint64x2_t) __builtin_neon_vcvtaq_u64_v((int8x16_t)__p0, 51);
  48923   return __ret;
  48924 }
  48925 #else
  48926 __ai __attribute__((target("neon"))) uint64x2_t vcvtaq_u64_f64(float64x2_t __p0) {
  48927   uint64x2_t __ret;
  48928   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48929   __ret = (uint64x2_t) __builtin_neon_vcvtaq_u64_v((int8x16_t)__rev0, 51);
  48930   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48931   return __ret;
  48932 }
  48933 #endif
  48934 
  48935 __ai __attribute__((target("neon"))) uint64x1_t vcvta_u64_f64(float64x1_t __p0) {
  48936   uint64x1_t __ret;
  48937   __ret = (uint64x1_t) __builtin_neon_vcvta_u64_v((int8x8_t)__p0, 19);
  48938   return __ret;
  48939 }
  48940 __ai __attribute__((target("neon"))) uint64_t vcvtad_u64_f64(float64_t __p0) {
  48941   uint64_t __ret;
  48942   __ret = (uint64_t) __builtin_neon_vcvtad_u64_f64(__p0);
  48943   return __ret;
  48944 }
  48945 __ai __attribute__((target("neon"))) int32_t vcvtms_s32_f32(float32_t __p0) {
  48946   int32_t __ret;
  48947   __ret = (int32_t) __builtin_neon_vcvtms_s32_f32(__p0);
  48948   return __ret;
  48949 }
  48950 #ifdef __LITTLE_ENDIAN__
  48951 __ai __attribute__((target("neon"))) int64x2_t vcvtmq_s64_f64(float64x2_t __p0) {
  48952   int64x2_t __ret;
  48953   __ret = (int64x2_t) __builtin_neon_vcvtmq_s64_v((int8x16_t)__p0, 35);
  48954   return __ret;
  48955 }
  48956 #else
  48957 __ai __attribute__((target("neon"))) int64x2_t vcvtmq_s64_f64(float64x2_t __p0) {
  48958   int64x2_t __ret;
  48959   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48960   __ret = (int64x2_t) __builtin_neon_vcvtmq_s64_v((int8x16_t)__rev0, 35);
  48961   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48962   return __ret;
  48963 }
  48964 #endif
  48965 
  48966 __ai __attribute__((target("neon"))) int64x1_t vcvtm_s64_f64(float64x1_t __p0) {
  48967   int64x1_t __ret;
  48968   __ret = (int64x1_t) __builtin_neon_vcvtm_s64_v((int8x8_t)__p0, 3);
  48969   return __ret;
  48970 }
  48971 __ai __attribute__((target("neon"))) int64_t vcvtmd_s64_f64(float64_t __p0) {
  48972   int64_t __ret;
  48973   __ret = (int64_t) __builtin_neon_vcvtmd_s64_f64(__p0);
  48974   return __ret;
  48975 }
  48976 __ai __attribute__((target("neon"))) uint32_t vcvtms_u32_f32(float32_t __p0) {
  48977   uint32_t __ret;
  48978   __ret = (uint32_t) __builtin_neon_vcvtms_u32_f32(__p0);
  48979   return __ret;
  48980 }
  48981 #ifdef __LITTLE_ENDIAN__
  48982 __ai __attribute__((target("neon"))) uint64x2_t vcvtmq_u64_f64(float64x2_t __p0) {
  48983   uint64x2_t __ret;
  48984   __ret = (uint64x2_t) __builtin_neon_vcvtmq_u64_v((int8x16_t)__p0, 51);
  48985   return __ret;
  48986 }
  48987 #else
  48988 __ai __attribute__((target("neon"))) uint64x2_t vcvtmq_u64_f64(float64x2_t __p0) {
  48989   uint64x2_t __ret;
  48990   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  48991   __ret = (uint64x2_t) __builtin_neon_vcvtmq_u64_v((int8x16_t)__rev0, 51);
  48992   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  48993   return __ret;
  48994 }
  48995 #endif
  48996 
  48997 __ai __attribute__((target("neon"))) uint64x1_t vcvtm_u64_f64(float64x1_t __p0) {
  48998   uint64x1_t __ret;
  48999   __ret = (uint64x1_t) __builtin_neon_vcvtm_u64_v((int8x8_t)__p0, 19);
  49000   return __ret;
  49001 }
  49002 __ai __attribute__((target("neon"))) uint64_t vcvtmd_u64_f64(float64_t __p0) {
  49003   uint64_t __ret;
  49004   __ret = (uint64_t) __builtin_neon_vcvtmd_u64_f64(__p0);
  49005   return __ret;
  49006 }
  49007 __ai __attribute__((target("neon"))) int32_t vcvtns_s32_f32(float32_t __p0) {
  49008   int32_t __ret;
  49009   __ret = (int32_t) __builtin_neon_vcvtns_s32_f32(__p0);
  49010   return __ret;
  49011 }
  49012 #ifdef __LITTLE_ENDIAN__
  49013 __ai __attribute__((target("neon"))) int64x2_t vcvtnq_s64_f64(float64x2_t __p0) {
  49014   int64x2_t __ret;
  49015   __ret = (int64x2_t) __builtin_neon_vcvtnq_s64_v((int8x16_t)__p0, 35);
  49016   return __ret;
  49017 }
  49018 #else
  49019 __ai __attribute__((target("neon"))) int64x2_t vcvtnq_s64_f64(float64x2_t __p0) {
  49020   int64x2_t __ret;
  49021   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49022   __ret = (int64x2_t) __builtin_neon_vcvtnq_s64_v((int8x16_t)__rev0, 35);
  49023   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49024   return __ret;
  49025 }
  49026 #endif
  49027 
  49028 __ai __attribute__((target("neon"))) int64x1_t vcvtn_s64_f64(float64x1_t __p0) {
  49029   int64x1_t __ret;
  49030   __ret = (int64x1_t) __builtin_neon_vcvtn_s64_v((int8x8_t)__p0, 3);
  49031   return __ret;
  49032 }
  49033 __ai __attribute__((target("neon"))) int64_t vcvtnd_s64_f64(float64_t __p0) {
  49034   int64_t __ret;
  49035   __ret = (int64_t) __builtin_neon_vcvtnd_s64_f64(__p0);
  49036   return __ret;
  49037 }
  49038 __ai __attribute__((target("neon"))) uint32_t vcvtns_u32_f32(float32_t __p0) {
  49039   uint32_t __ret;
  49040   __ret = (uint32_t) __builtin_neon_vcvtns_u32_f32(__p0);
  49041   return __ret;
  49042 }
  49043 #ifdef __LITTLE_ENDIAN__
  49044 __ai __attribute__((target("neon"))) uint64x2_t vcvtnq_u64_f64(float64x2_t __p0) {
  49045   uint64x2_t __ret;
  49046   __ret = (uint64x2_t) __builtin_neon_vcvtnq_u64_v((int8x16_t)__p0, 51);
  49047   return __ret;
  49048 }
  49049 #else
  49050 __ai __attribute__((target("neon"))) uint64x2_t vcvtnq_u64_f64(float64x2_t __p0) {
  49051   uint64x2_t __ret;
  49052   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49053   __ret = (uint64x2_t) __builtin_neon_vcvtnq_u64_v((int8x16_t)__rev0, 51);
  49054   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49055   return __ret;
  49056 }
  49057 #endif
  49058 
  49059 __ai __attribute__((target("neon"))) uint64x1_t vcvtn_u64_f64(float64x1_t __p0) {
  49060   uint64x1_t __ret;
  49061   __ret = (uint64x1_t) __builtin_neon_vcvtn_u64_v((int8x8_t)__p0, 19);
  49062   return __ret;
  49063 }
  49064 __ai __attribute__((target("neon"))) uint64_t vcvtnd_u64_f64(float64_t __p0) {
  49065   uint64_t __ret;
  49066   __ret = (uint64_t) __builtin_neon_vcvtnd_u64_f64(__p0);
  49067   return __ret;
  49068 }
  49069 __ai __attribute__((target("neon"))) int32_t vcvtps_s32_f32(float32_t __p0) {
  49070   int32_t __ret;
  49071   __ret = (int32_t) __builtin_neon_vcvtps_s32_f32(__p0);
  49072   return __ret;
  49073 }
  49074 #ifdef __LITTLE_ENDIAN__
  49075 __ai __attribute__((target("neon"))) int64x2_t vcvtpq_s64_f64(float64x2_t __p0) {
  49076   int64x2_t __ret;
  49077   __ret = (int64x2_t) __builtin_neon_vcvtpq_s64_v((int8x16_t)__p0, 35);
  49078   return __ret;
  49079 }
  49080 #else
  49081 __ai __attribute__((target("neon"))) int64x2_t vcvtpq_s64_f64(float64x2_t __p0) {
  49082   int64x2_t __ret;
  49083   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49084   __ret = (int64x2_t) __builtin_neon_vcvtpq_s64_v((int8x16_t)__rev0, 35);
  49085   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49086   return __ret;
  49087 }
  49088 #endif
  49089 
  49090 __ai __attribute__((target("neon"))) int64x1_t vcvtp_s64_f64(float64x1_t __p0) {
  49091   int64x1_t __ret;
  49092   __ret = (int64x1_t) __builtin_neon_vcvtp_s64_v((int8x8_t)__p0, 3);
  49093   return __ret;
  49094 }
  49095 __ai __attribute__((target("neon"))) int64_t vcvtpd_s64_f64(float64_t __p0) {
  49096   int64_t __ret;
  49097   __ret = (int64_t) __builtin_neon_vcvtpd_s64_f64(__p0);
  49098   return __ret;
  49099 }
  49100 __ai __attribute__((target("neon"))) uint32_t vcvtps_u32_f32(float32_t __p0) {
  49101   uint32_t __ret;
  49102   __ret = (uint32_t) __builtin_neon_vcvtps_u32_f32(__p0);
  49103   return __ret;
  49104 }
  49105 #ifdef __LITTLE_ENDIAN__
  49106 __ai __attribute__((target("neon"))) uint64x2_t vcvtpq_u64_f64(float64x2_t __p0) {
  49107   uint64x2_t __ret;
  49108   __ret = (uint64x2_t) __builtin_neon_vcvtpq_u64_v((int8x16_t)__p0, 51);
  49109   return __ret;
  49110 }
  49111 #else
  49112 __ai __attribute__((target("neon"))) uint64x2_t vcvtpq_u64_f64(float64x2_t __p0) {
  49113   uint64x2_t __ret;
  49114   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49115   __ret = (uint64x2_t) __builtin_neon_vcvtpq_u64_v((int8x16_t)__rev0, 51);
  49116   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49117   return __ret;
  49118 }
  49119 #endif
  49120 
  49121 __ai __attribute__((target("neon"))) uint64x1_t vcvtp_u64_f64(float64x1_t __p0) {
  49122   uint64x1_t __ret;
  49123   __ret = (uint64x1_t) __builtin_neon_vcvtp_u64_v((int8x8_t)__p0, 19);
  49124   return __ret;
  49125 }
  49126 __ai __attribute__((target("neon"))) uint64_t vcvtpd_u64_f64(float64_t __p0) {
  49127   uint64_t __ret;
  49128   __ret = (uint64_t) __builtin_neon_vcvtpd_u64_f64(__p0);
  49129   return __ret;
  49130 }
  49131 __ai __attribute__((target("neon"))) float32_t vcvtxd_f32_f64(float64_t __p0) {
  49132   float32_t __ret;
  49133   __ret = (float32_t) __builtin_neon_vcvtxd_f32_f64(__p0);
  49134   return __ret;
  49135 }
  49136 #ifdef __LITTLE_ENDIAN__
  49137 __ai __attribute__((target("neon"))) float32x2_t vcvtx_f32_f64(float64x2_t __p0) {
  49138   float32x2_t __ret;
  49139   __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__p0, 42);
  49140   return __ret;
  49141 }
  49142 #else
  49143 __ai __attribute__((target("neon"))) float32x2_t vcvtx_f32_f64(float64x2_t __p0) {
  49144   float32x2_t __ret;
  49145   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49146   __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__rev0, 42);
  49147   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49148   return __ret;
  49149 }
  49150 __ai __attribute__((target("neon"))) float32x2_t __noswap_vcvtx_f32_f64(float64x2_t __p0) {
  49151   float32x2_t __ret;
  49152   __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__p0, 42);
  49153   return __ret;
  49154 }
  49155 #endif
  49156 
  49157 #ifdef __LITTLE_ENDIAN__
  49158 __ai __attribute__((target("neon"))) float32x4_t vcvtx_high_f32_f64(float32x2_t __p0, float64x2_t __p1) {
  49159   float32x4_t __ret;
  49160   __ret = vcombine_f32(__p0, vcvtx_f32_f64(__p1));
  49161   return __ret;
  49162 }
  49163 #else
  49164 __ai __attribute__((target("neon"))) float32x4_t vcvtx_high_f32_f64(float32x2_t __p0, float64x2_t __p1) {
  49165   float32x4_t __ret;
  49166   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49167   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  49168   __ret = __noswap_vcombine_f32(__rev0, __noswap_vcvtx_f32_f64(__rev1));
  49169   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  49170   return __ret;
  49171 }
  49172 #endif
  49173 
  49174 #ifdef __LITTLE_ENDIAN__
  49175 __ai __attribute__((target("neon"))) float64x2_t vdivq_f64(float64x2_t __p0, float64x2_t __p1) {
  49176   float64x2_t __ret;
  49177   __ret = __p0 / __p1;
  49178   return __ret;
  49179 }
  49180 #else
  49181 __ai __attribute__((target("neon"))) float64x2_t vdivq_f64(float64x2_t __p0, float64x2_t __p1) {
  49182   float64x2_t __ret;
  49183   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49184   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  49185   __ret = __rev0 / __rev1;
  49186   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49187   return __ret;
  49188 }
  49189 #endif
  49190 
  49191 #ifdef __LITTLE_ENDIAN__
  49192 __ai __attribute__((target("neon"))) float32x4_t vdivq_f32(float32x4_t __p0, float32x4_t __p1) {
  49193   float32x4_t __ret;
  49194   __ret = __p0 / __p1;
  49195   return __ret;
  49196 }
  49197 #else
  49198 __ai __attribute__((target("neon"))) float32x4_t vdivq_f32(float32x4_t __p0, float32x4_t __p1) {
  49199   float32x4_t __ret;
  49200   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  49201   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  49202   __ret = __rev0 / __rev1;
  49203   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  49204   return __ret;
  49205 }
  49206 #endif
  49207 
  49208 __ai __attribute__((target("neon"))) float64x1_t vdiv_f64(float64x1_t __p0, float64x1_t __p1) {
  49209   float64x1_t __ret;
  49210   __ret = __p0 / __p1;
  49211   return __ret;
  49212 }
  49213 #ifdef __LITTLE_ENDIAN__
  49214 __ai __attribute__((target("neon"))) float32x2_t vdiv_f32(float32x2_t __p0, float32x2_t __p1) {
  49215   float32x2_t __ret;
  49216   __ret = __p0 / __p1;
  49217   return __ret;
  49218 }
  49219 #else
  49220 __ai __attribute__((target("neon"))) float32x2_t vdiv_f32(float32x2_t __p0, float32x2_t __p1) {
  49221   float32x2_t __ret;
  49222   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  49223   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  49224   __ret = __rev0 / __rev1;
  49225   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  49226   return __ret;
  49227 }
  49228 #endif
  49229 
  49230 #ifdef __LITTLE_ENDIAN__
  49231 #define vdupb_lane_p8(__p0, __p1) __extension__ ({ \
  49232   poly8_t __ret; \
  49233   poly8x8_t __s0 = __p0; \
  49234   __ret = (poly8_t) __builtin_neon_vdupb_lane_i8((poly8x8_t)__s0, __p1); \
  49235   __ret; \
  49236 })
  49237 #else
  49238 #define vdupb_lane_p8(__p0, __p1) __extension__ ({ \
  49239   poly8_t __ret; \
  49240   poly8x8_t __s0 = __p0; \
  49241   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49242   __ret = (poly8_t) __builtin_neon_vdupb_lane_i8((poly8x8_t)__rev0, __p1); \
  49243   __ret; \
  49244 })
  49245 #endif
  49246 
  49247 #ifdef __LITTLE_ENDIAN__
  49248 #define vduph_lane_p16(__p0, __p1) __extension__ ({ \
  49249   poly16_t __ret; \
  49250   poly16x4_t __s0 = __p0; \
  49251   __ret = (poly16_t) __builtin_neon_vduph_lane_i16((poly16x4_t)__s0, __p1); \
  49252   __ret; \
  49253 })
  49254 #else
  49255 #define vduph_lane_p16(__p0, __p1) __extension__ ({ \
  49256   poly16_t __ret; \
  49257   poly16x4_t __s0 = __p0; \
  49258   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49259   __ret = (poly16_t) __builtin_neon_vduph_lane_i16((poly16x4_t)__rev0, __p1); \
  49260   __ret; \
  49261 })
  49262 #endif
  49263 
  49264 #ifdef __LITTLE_ENDIAN__
  49265 #define vdupb_lane_u8(__p0, __p1) __extension__ ({ \
  49266   uint8_t __ret; \
  49267   uint8x8_t __s0 = __p0; \
  49268   __ret = (uint8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__s0, __p1); \
  49269   __ret; \
  49270 })
  49271 #else
  49272 #define vdupb_lane_u8(__p0, __p1) __extension__ ({ \
  49273   uint8_t __ret; \
  49274   uint8x8_t __s0 = __p0; \
  49275   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49276   __ret = (uint8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__rev0, __p1); \
  49277   __ret; \
  49278 })
  49279 #endif
  49280 
  49281 #ifdef __LITTLE_ENDIAN__
  49282 #define vdups_lane_u32(__p0, __p1) __extension__ ({ \
  49283   uint32_t __ret; \
  49284   uint32x2_t __s0 = __p0; \
  49285   __ret = (uint32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__s0, __p1); \
  49286   __ret; \
  49287 })
  49288 #else
  49289 #define vdups_lane_u32(__p0, __p1) __extension__ ({ \
  49290   uint32_t __ret; \
  49291   uint32x2_t __s0 = __p0; \
  49292   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49293   __ret = (uint32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__rev0, __p1); \
  49294   __ret; \
  49295 })
  49296 #endif
  49297 
  49298 #define vdupd_lane_u64(__p0, __p1) __extension__ ({ \
  49299   uint64_t __ret; \
  49300   uint64x1_t __s0 = __p0; \
  49301   __ret = (uint64_t) __builtin_neon_vdupd_lane_i64((int64x1_t)__s0, __p1); \
  49302   __ret; \
  49303 })
  49304 #ifdef __LITTLE_ENDIAN__
  49305 #define vduph_lane_u16(__p0, __p1) __extension__ ({ \
  49306   uint16_t __ret; \
  49307   uint16x4_t __s0 = __p0; \
  49308   __ret = (uint16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__s0, __p1); \
  49309   __ret; \
  49310 })
  49311 #else
  49312 #define vduph_lane_u16(__p0, __p1) __extension__ ({ \
  49313   uint16_t __ret; \
  49314   uint16x4_t __s0 = __p0; \
  49315   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49316   __ret = (uint16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__rev0, __p1); \
  49317   __ret; \
  49318 })
  49319 #endif
  49320 
  49321 #ifdef __LITTLE_ENDIAN__
  49322 #define vdupb_lane_s8(__p0, __p1) __extension__ ({ \
  49323   int8_t __ret; \
  49324   int8x8_t __s0 = __p0; \
  49325   __ret = (int8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__s0, __p1); \
  49326   __ret; \
  49327 })
  49328 #else
  49329 #define vdupb_lane_s8(__p0, __p1) __extension__ ({ \
  49330   int8_t __ret; \
  49331   int8x8_t __s0 = __p0; \
  49332   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49333   __ret = (int8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__rev0, __p1); \
  49334   __ret; \
  49335 })
  49336 #endif
  49337 
  49338 #define vdupd_lane_f64(__p0, __p1) __extension__ ({ \
  49339   float64_t __ret; \
  49340   float64x1_t __s0 = __p0; \
  49341   __ret = (float64_t) __builtin_neon_vdupd_lane_f64((float64x1_t)__s0, __p1); \
  49342   __ret; \
  49343 })
  49344 #ifdef __LITTLE_ENDIAN__
  49345 #define vdups_lane_f32(__p0, __p1) __extension__ ({ \
  49346   float32_t __ret; \
  49347   float32x2_t __s0 = __p0; \
  49348   __ret = (float32_t) __builtin_neon_vdups_lane_f32((float32x2_t)__s0, __p1); \
  49349   __ret; \
  49350 })
  49351 #else
  49352 #define vdups_lane_f32(__p0, __p1) __extension__ ({ \
  49353   float32_t __ret; \
  49354   float32x2_t __s0 = __p0; \
  49355   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49356   __ret = (float32_t) __builtin_neon_vdups_lane_f32((float32x2_t)__rev0, __p1); \
  49357   __ret; \
  49358 })
  49359 #endif
  49360 
  49361 #ifdef __LITTLE_ENDIAN__
  49362 #define vdups_lane_s32(__p0, __p1) __extension__ ({ \
  49363   int32_t __ret; \
  49364   int32x2_t __s0 = __p0; \
  49365   __ret = (int32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__s0, __p1); \
  49366   __ret; \
  49367 })
  49368 #else
  49369 #define vdups_lane_s32(__p0, __p1) __extension__ ({ \
  49370   int32_t __ret; \
  49371   int32x2_t __s0 = __p0; \
  49372   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49373   __ret = (int32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__rev0, __p1); \
  49374   __ret; \
  49375 })
  49376 #endif
  49377 
  49378 #define vdupd_lane_s64(__p0, __p1) __extension__ ({ \
  49379   int64_t __ret; \
  49380   int64x1_t __s0 = __p0; \
  49381   __ret = (int64_t) __builtin_neon_vdupd_lane_i64((int64x1_t)__s0, __p1); \
  49382   __ret; \
  49383 })
  49384 #ifdef __LITTLE_ENDIAN__
  49385 #define vduph_lane_s16(__p0, __p1) __extension__ ({ \
  49386   int16_t __ret; \
  49387   int16x4_t __s0 = __p0; \
  49388   __ret = (int16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__s0, __p1); \
  49389   __ret; \
  49390 })
  49391 #else
  49392 #define vduph_lane_s16(__p0, __p1) __extension__ ({ \
  49393   int16_t __ret; \
  49394   int16x4_t __s0 = __p0; \
  49395   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49396   __ret = (int16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__rev0, __p1); \
  49397   __ret; \
  49398 })
  49399 #endif
  49400 
  49401 #ifdef __LITTLE_ENDIAN__
  49402 #define vduph_lane_f16(__p0, __p1) __extension__ ({ \
  49403   float16_t __ret; \
  49404   float16x4_t __s0 = __p0; \
  49405   __ret = (float16_t) __builtin_neon_vduph_lane_f16((float16x4_t)__s0, __p1); \
  49406   __ret; \
  49407 })
  49408 #else
  49409 #define vduph_lane_f16(__p0, __p1) __extension__ ({ \
  49410   float16_t __ret; \
  49411   float16x4_t __s0 = __p0; \
  49412   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49413   __ret = (float16_t) __builtin_neon_vduph_lane_f16((float16x4_t)__rev0, __p1); \
  49414   __ret; \
  49415 })
  49416 #endif
  49417 
  49418 #define vdup_lane_p64(__p0_364, __p1_364) __extension__ ({ \
  49419   poly64x1_t __ret_364; \
  49420   poly64x1_t __s0_364 = __p0_364; \
  49421   __ret_364 = splat_lane_p64(__s0_364, __p1_364); \
  49422   __ret_364; \
  49423 })
  49424 #ifdef __LITTLE_ENDIAN__
  49425 #define vdupq_lane_p64(__p0_365, __p1_365) __extension__ ({ \
  49426   poly64x2_t __ret_365; \
  49427   poly64x1_t __s0_365 = __p0_365; \
  49428   __ret_365 = splatq_lane_p64(__s0_365, __p1_365); \
  49429   __ret_365; \
  49430 })
  49431 #else
  49432 #define vdupq_lane_p64(__p0_366, __p1_366) __extension__ ({ \
  49433   poly64x2_t __ret_366; \
  49434   poly64x1_t __s0_366 = __p0_366; \
  49435   __ret_366 = __noswap_splatq_lane_p64(__s0_366, __p1_366); \
  49436   __ret_366 = __builtin_shufflevector(__ret_366, __ret_366, 1, 0); \
  49437   __ret_366; \
  49438 })
  49439 #endif
  49440 
  49441 #ifdef __LITTLE_ENDIAN__
  49442 #define vdupq_lane_f64(__p0_367, __p1_367) __extension__ ({ \
  49443   float64x2_t __ret_367; \
  49444   float64x1_t __s0_367 = __p0_367; \
  49445   __ret_367 = splatq_lane_f64(__s0_367, __p1_367); \
  49446   __ret_367; \
  49447 })
  49448 #else
  49449 #define vdupq_lane_f64(__p0_368, __p1_368) __extension__ ({ \
  49450   float64x2_t __ret_368; \
  49451   float64x1_t __s0_368 = __p0_368; \
  49452   __ret_368 = __noswap_splatq_lane_f64(__s0_368, __p1_368); \
  49453   __ret_368 = __builtin_shufflevector(__ret_368, __ret_368, 1, 0); \
  49454   __ret_368; \
  49455 })
  49456 #endif
  49457 
  49458 #define vdup_lane_f64(__p0_369, __p1_369) __extension__ ({ \
  49459   float64x1_t __ret_369; \
  49460   float64x1_t __s0_369 = __p0_369; \
  49461   __ret_369 = splat_lane_f64(__s0_369, __p1_369); \
  49462   __ret_369; \
  49463 })
  49464 #ifdef __LITTLE_ENDIAN__
  49465 #define vdupb_laneq_p8(__p0, __p1) __extension__ ({ \
  49466   poly8_t __ret; \
  49467   poly8x16_t __s0 = __p0; \
  49468   __ret = (poly8_t) __builtin_neon_vdupb_laneq_i8((poly8x16_t)__s0, __p1); \
  49469   __ret; \
  49470 })
  49471 #else
  49472 #define vdupb_laneq_p8(__p0, __p1) __extension__ ({ \
  49473   poly8_t __ret; \
  49474   poly8x16_t __s0 = __p0; \
  49475   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49476   __ret = (poly8_t) __builtin_neon_vdupb_laneq_i8((poly8x16_t)__rev0, __p1); \
  49477   __ret; \
  49478 })
  49479 #endif
  49480 
  49481 #ifdef __LITTLE_ENDIAN__
  49482 #define vduph_laneq_p16(__p0, __p1) __extension__ ({ \
  49483   poly16_t __ret; \
  49484   poly16x8_t __s0 = __p0; \
  49485   __ret = (poly16_t) __builtin_neon_vduph_laneq_i16((poly16x8_t)__s0, __p1); \
  49486   __ret; \
  49487 })
  49488 #else
  49489 #define vduph_laneq_p16(__p0, __p1) __extension__ ({ \
  49490   poly16_t __ret; \
  49491   poly16x8_t __s0 = __p0; \
  49492   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49493   __ret = (poly16_t) __builtin_neon_vduph_laneq_i16((poly16x8_t)__rev0, __p1); \
  49494   __ret; \
  49495 })
  49496 #endif
  49497 
  49498 #ifdef __LITTLE_ENDIAN__
  49499 #define vdupb_laneq_u8(__p0, __p1) __extension__ ({ \
  49500   uint8_t __ret; \
  49501   uint8x16_t __s0 = __p0; \
  49502   __ret = (uint8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__s0, __p1); \
  49503   __ret; \
  49504 })
  49505 #else
  49506 #define vdupb_laneq_u8(__p0, __p1) __extension__ ({ \
  49507   uint8_t __ret; \
  49508   uint8x16_t __s0 = __p0; \
  49509   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49510   __ret = (uint8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__rev0, __p1); \
  49511   __ret; \
  49512 })
  49513 #endif
  49514 
  49515 #ifdef __LITTLE_ENDIAN__
  49516 #define vdups_laneq_u32(__p0, __p1) __extension__ ({ \
  49517   uint32_t __ret; \
  49518   uint32x4_t __s0 = __p0; \
  49519   __ret = (uint32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__s0, __p1); \
  49520   __ret; \
  49521 })
  49522 #else
  49523 #define vdups_laneq_u32(__p0, __p1) __extension__ ({ \
  49524   uint32_t __ret; \
  49525   uint32x4_t __s0 = __p0; \
  49526   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49527   __ret = (uint32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__rev0, __p1); \
  49528   __ret; \
  49529 })
  49530 #endif
  49531 
  49532 #ifdef __LITTLE_ENDIAN__
  49533 #define vdupd_laneq_u64(__p0, __p1) __extension__ ({ \
  49534   uint64_t __ret; \
  49535   uint64x2_t __s0 = __p0; \
  49536   __ret = (uint64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__s0, __p1); \
  49537   __ret; \
  49538 })
  49539 #else
  49540 #define vdupd_laneq_u64(__p0, __p1) __extension__ ({ \
  49541   uint64_t __ret; \
  49542   uint64x2_t __s0 = __p0; \
  49543   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49544   __ret = (uint64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__rev0, __p1); \
  49545   __ret; \
  49546 })
  49547 #endif
  49548 
  49549 #ifdef __LITTLE_ENDIAN__
  49550 #define vduph_laneq_u16(__p0, __p1) __extension__ ({ \
  49551   uint16_t __ret; \
  49552   uint16x8_t __s0 = __p0; \
  49553   __ret = (uint16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__s0, __p1); \
  49554   __ret; \
  49555 })
  49556 #else
  49557 #define vduph_laneq_u16(__p0, __p1) __extension__ ({ \
  49558   uint16_t __ret; \
  49559   uint16x8_t __s0 = __p0; \
  49560   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49561   __ret = (uint16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__rev0, __p1); \
  49562   __ret; \
  49563 })
  49564 #endif
  49565 
  49566 #ifdef __LITTLE_ENDIAN__
  49567 #define vdupb_laneq_s8(__p0, __p1) __extension__ ({ \
  49568   int8_t __ret; \
  49569   int8x16_t __s0 = __p0; \
  49570   __ret = (int8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__s0, __p1); \
  49571   __ret; \
  49572 })
  49573 #else
  49574 #define vdupb_laneq_s8(__p0, __p1) __extension__ ({ \
  49575   int8_t __ret; \
  49576   int8x16_t __s0 = __p0; \
  49577   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49578   __ret = (int8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__rev0, __p1); \
  49579   __ret; \
  49580 })
  49581 #endif
  49582 
  49583 #ifdef __LITTLE_ENDIAN__
  49584 #define vdupd_laneq_f64(__p0, __p1) __extension__ ({ \
  49585   float64_t __ret; \
  49586   float64x2_t __s0 = __p0; \
  49587   __ret = (float64_t) __builtin_neon_vdupd_laneq_f64((float64x2_t)__s0, __p1); \
  49588   __ret; \
  49589 })
  49590 #else
  49591 #define vdupd_laneq_f64(__p0, __p1) __extension__ ({ \
  49592   float64_t __ret; \
  49593   float64x2_t __s0 = __p0; \
  49594   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49595   __ret = (float64_t) __builtin_neon_vdupd_laneq_f64((float64x2_t)__rev0, __p1); \
  49596   __ret; \
  49597 })
  49598 #endif
  49599 
  49600 #ifdef __LITTLE_ENDIAN__
  49601 #define vdups_laneq_f32(__p0, __p1) __extension__ ({ \
  49602   float32_t __ret; \
  49603   float32x4_t __s0 = __p0; \
  49604   __ret = (float32_t) __builtin_neon_vdups_laneq_f32((float32x4_t)__s0, __p1); \
  49605   __ret; \
  49606 })
  49607 #else
  49608 #define vdups_laneq_f32(__p0, __p1) __extension__ ({ \
  49609   float32_t __ret; \
  49610   float32x4_t __s0 = __p0; \
  49611   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49612   __ret = (float32_t) __builtin_neon_vdups_laneq_f32((float32x4_t)__rev0, __p1); \
  49613   __ret; \
  49614 })
  49615 #endif
  49616 
  49617 #ifdef __LITTLE_ENDIAN__
  49618 #define vdups_laneq_s32(__p0, __p1) __extension__ ({ \
  49619   int32_t __ret; \
  49620   int32x4_t __s0 = __p0; \
  49621   __ret = (int32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__s0, __p1); \
  49622   __ret; \
  49623 })
  49624 #else
  49625 #define vdups_laneq_s32(__p0, __p1) __extension__ ({ \
  49626   int32_t __ret; \
  49627   int32x4_t __s0 = __p0; \
  49628   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  49629   __ret = (int32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__rev0, __p1); \
  49630   __ret; \
  49631 })
  49632 #endif
  49633 
  49634 #ifdef __LITTLE_ENDIAN__
  49635 #define vdupd_laneq_s64(__p0, __p1) __extension__ ({ \
  49636   int64_t __ret; \
  49637   int64x2_t __s0 = __p0; \
  49638   __ret = (int64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__s0, __p1); \
  49639   __ret; \
  49640 })
  49641 #else
  49642 #define vdupd_laneq_s64(__p0, __p1) __extension__ ({ \
  49643   int64_t __ret; \
  49644   int64x2_t __s0 = __p0; \
  49645   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  49646   __ret = (int64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__rev0, __p1); \
  49647   __ret; \
  49648 })
  49649 #endif
  49650 
  49651 #ifdef __LITTLE_ENDIAN__
  49652 #define vduph_laneq_s16(__p0, __p1) __extension__ ({ \
  49653   int16_t __ret; \
  49654   int16x8_t __s0 = __p0; \
  49655   __ret = (int16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__s0, __p1); \
  49656   __ret; \
  49657 })
  49658 #else
  49659 #define vduph_laneq_s16(__p0, __p1) __extension__ ({ \
  49660   int16_t __ret; \
  49661   int16x8_t __s0 = __p0; \
  49662   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49663   __ret = (int16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__rev0, __p1); \
  49664   __ret; \
  49665 })
  49666 #endif
  49667 
  49668 #ifdef __LITTLE_ENDIAN__
  49669 #define vduph_laneq_f16(__p0, __p1) __extension__ ({ \
  49670   float16_t __ret; \
  49671   float16x8_t __s0 = __p0; \
  49672   __ret = (float16_t) __builtin_neon_vduph_laneq_f16((float16x8_t)__s0, __p1); \
  49673   __ret; \
  49674 })
  49675 #else
  49676 #define vduph_laneq_f16(__p0, __p1) __extension__ ({ \
  49677   float16_t __ret; \
  49678   float16x8_t __s0 = __p0; \
  49679   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  49680   __ret = (float16_t) __builtin_neon_vduph_laneq_f16((float16x8_t)__rev0, __p1); \
  49681   __ret; \
  49682 })
  49683 #endif
  49684 
  49685 #ifdef __LITTLE_ENDIAN__
  49686 #define vdup_laneq_p8(__p0_370, __p1_370) __extension__ ({ \
  49687   poly8x8_t __ret_370; \
  49688   poly8x16_t __s0_370 = __p0_370; \
  49689   __ret_370 = splat_laneq_p8(__s0_370, __p1_370); \
  49690   __ret_370; \
  49691 })
  49692 #else
  49693 #define vdup_laneq_p8(__p0_371, __p1_371) __extension__ ({ \
  49694   poly8x8_t __ret_371; \
  49695   poly8x16_t __s0_371 = __p0_371; \
  49696   poly8x16_t __rev0_371;  __rev0_371 = __builtin_shufflevector(__s0_371, __s0_371, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49697   __ret_371 = __noswap_splat_laneq_p8(__rev0_371, __p1_371); \
  49698   __ret_371 = __builtin_shufflevector(__ret_371, __ret_371, 7, 6, 5, 4, 3, 2, 1, 0); \
  49699   __ret_371; \
  49700 })
  49701 #endif
  49702 
  49703 #ifdef __LITTLE_ENDIAN__
  49704 #define vdup_laneq_p64(__p0_372, __p1_372) __extension__ ({ \
  49705   poly64x1_t __ret_372; \
  49706   poly64x2_t __s0_372 = __p0_372; \
  49707   __ret_372 = splat_laneq_p64(__s0_372, __p1_372); \
  49708   __ret_372; \
  49709 })
  49710 #else
  49711 #define vdup_laneq_p64(__p0_373, __p1_373) __extension__ ({ \
  49712   poly64x1_t __ret_373; \
  49713   poly64x2_t __s0_373 = __p0_373; \
  49714   poly64x2_t __rev0_373;  __rev0_373 = __builtin_shufflevector(__s0_373, __s0_373, 1, 0); \
  49715   __ret_373 = __noswap_splat_laneq_p64(__rev0_373, __p1_373); \
  49716   __ret_373; \
  49717 })
  49718 #endif
  49719 
  49720 #ifdef __LITTLE_ENDIAN__
  49721 #define vdup_laneq_p16(__p0_374, __p1_374) __extension__ ({ \
  49722   poly16x4_t __ret_374; \
  49723   poly16x8_t __s0_374 = __p0_374; \
  49724   __ret_374 = splat_laneq_p16(__s0_374, __p1_374); \
  49725   __ret_374; \
  49726 })
  49727 #else
  49728 #define vdup_laneq_p16(__p0_375, __p1_375) __extension__ ({ \
  49729   poly16x4_t __ret_375; \
  49730   poly16x8_t __s0_375 = __p0_375; \
  49731   poly16x8_t __rev0_375;  __rev0_375 = __builtin_shufflevector(__s0_375, __s0_375, 7, 6, 5, 4, 3, 2, 1, 0); \
  49732   __ret_375 = __noswap_splat_laneq_p16(__rev0_375, __p1_375); \
  49733   __ret_375 = __builtin_shufflevector(__ret_375, __ret_375, 3, 2, 1, 0); \
  49734   __ret_375; \
  49735 })
  49736 #endif
  49737 
  49738 #ifdef __LITTLE_ENDIAN__
  49739 #define vdupq_laneq_p8(__p0_376, __p1_376) __extension__ ({ \
  49740   poly8x16_t __ret_376; \
  49741   poly8x16_t __s0_376 = __p0_376; \
  49742   __ret_376 = splatq_laneq_p8(__s0_376, __p1_376); \
  49743   __ret_376; \
  49744 })
  49745 #else
  49746 #define vdupq_laneq_p8(__p0_377, __p1_377) __extension__ ({ \
  49747   poly8x16_t __ret_377; \
  49748   poly8x16_t __s0_377 = __p0_377; \
  49749   poly8x16_t __rev0_377;  __rev0_377 = __builtin_shufflevector(__s0_377, __s0_377, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49750   __ret_377 = __noswap_splatq_laneq_p8(__rev0_377, __p1_377); \
  49751   __ret_377 = __builtin_shufflevector(__ret_377, __ret_377, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49752   __ret_377; \
  49753 })
  49754 #endif
  49755 
  49756 #ifdef __LITTLE_ENDIAN__
  49757 #define vdupq_laneq_p64(__p0_378, __p1_378) __extension__ ({ \
  49758   poly64x2_t __ret_378; \
  49759   poly64x2_t __s0_378 = __p0_378; \
  49760   __ret_378 = splatq_laneq_p64(__s0_378, __p1_378); \
  49761   __ret_378; \
  49762 })
  49763 #else
  49764 #define vdupq_laneq_p64(__p0_379, __p1_379) __extension__ ({ \
  49765   poly64x2_t __ret_379; \
  49766   poly64x2_t __s0_379 = __p0_379; \
  49767   poly64x2_t __rev0_379;  __rev0_379 = __builtin_shufflevector(__s0_379, __s0_379, 1, 0); \
  49768   __ret_379 = __noswap_splatq_laneq_p64(__rev0_379, __p1_379); \
  49769   __ret_379 = __builtin_shufflevector(__ret_379, __ret_379, 1, 0); \
  49770   __ret_379; \
  49771 })
  49772 #endif
  49773 
  49774 #ifdef __LITTLE_ENDIAN__
  49775 #define vdupq_laneq_p16(__p0_380, __p1_380) __extension__ ({ \
  49776   poly16x8_t __ret_380; \
  49777   poly16x8_t __s0_380 = __p0_380; \
  49778   __ret_380 = splatq_laneq_p16(__s0_380, __p1_380); \
  49779   __ret_380; \
  49780 })
  49781 #else
  49782 #define vdupq_laneq_p16(__p0_381, __p1_381) __extension__ ({ \
  49783   poly16x8_t __ret_381; \
  49784   poly16x8_t __s0_381 = __p0_381; \
  49785   poly16x8_t __rev0_381;  __rev0_381 = __builtin_shufflevector(__s0_381, __s0_381, 7, 6, 5, 4, 3, 2, 1, 0); \
  49786   __ret_381 = __noswap_splatq_laneq_p16(__rev0_381, __p1_381); \
  49787   __ret_381 = __builtin_shufflevector(__ret_381, __ret_381, 7, 6, 5, 4, 3, 2, 1, 0); \
  49788   __ret_381; \
  49789 })
  49790 #endif
  49791 
  49792 #ifdef __LITTLE_ENDIAN__
  49793 #define vdupq_laneq_u8(__p0_382, __p1_382) __extension__ ({ \
  49794   uint8x16_t __ret_382; \
  49795   uint8x16_t __s0_382 = __p0_382; \
  49796   __ret_382 = splatq_laneq_u8(__s0_382, __p1_382); \
  49797   __ret_382; \
  49798 })
  49799 #else
  49800 #define vdupq_laneq_u8(__p0_383, __p1_383) __extension__ ({ \
  49801   uint8x16_t __ret_383; \
  49802   uint8x16_t __s0_383 = __p0_383; \
  49803   uint8x16_t __rev0_383;  __rev0_383 = __builtin_shufflevector(__s0_383, __s0_383, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49804   __ret_383 = __noswap_splatq_laneq_u8(__rev0_383, __p1_383); \
  49805   __ret_383 = __builtin_shufflevector(__ret_383, __ret_383, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  49806   __ret_383; \
  49807 })
  49808 #endif
  49809 
  49810 #ifdef __LITTLE_ENDIAN__
  49811 #define vdupq_laneq_u32(__p0_384, __p1_384) __extension__ ({ \
  49812   uint32x4_t __ret_384; \
  49813   uint32x4_t __s0_384 = __p0_384; \
  49814   __ret_384 = splatq_laneq_u32(__s0_384, __p1_384); \
  49815   __ret_384; \
  49816 })
  49817 #else
  49818 #define vdupq_laneq_u32(__p0_385, __p1_385) __extension__ ({ \
  49819   uint32x4_t __ret_385; \
  49820   uint32x4_t __s0_385 = __p0_385; \
  49821   uint32x4_t __rev0_385;  __rev0_385 = __builtin_shufflevector(__s0_385, __s0_385, 3, 2, 1, 0); \
  49822   __ret_385 = __noswap_splatq_laneq_u32(__rev0_385, __p1_385); \
  49823   __ret_385 = __builtin_shufflevector(__ret_385, __ret_385, 3, 2, 1, 0); \
  49824   __ret_385; \
  49825 })
  49826 #endif
  49827 
  49828 #ifdef __LITTLE_ENDIAN__
  49829 #define vdupq_laneq_u64(__p0_386, __p1_386) __extension__ ({ \
  49830   uint64x2_t __ret_386; \
  49831   uint64x2_t __s0_386 = __p0_386; \
  49832   __ret_386 = splatq_laneq_u64(__s0_386, __p1_386); \
  49833   __ret_386; \
  49834 })
  49835 #else
  49836 #define vdupq_laneq_u64(__p0_387, __p1_387) __extension__ ({ \
  49837   uint64x2_t __ret_387; \
  49838   uint64x2_t __s0_387 = __p0_387; \
  49839   uint64x2_t __rev0_387;  __rev0_387 = __builtin_shufflevector(__s0_387, __s0_387, 1, 0); \
  49840   __ret_387 = __noswap_splatq_laneq_u64(__rev0_387, __p1_387); \
  49841   __ret_387 = __builtin_shufflevector(__ret_387, __ret_387, 1, 0); \
  49842   __ret_387; \
  49843 })
  49844 #endif
  49845 
  49846 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_u16(v, lane): uint16x8_t in, uint16x8_t out; forwards to splatq_laneq_u16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49847 #define vdupq_laneq_u16(__p0_388, __p1_388) __extension__ ({ \
  49848   uint16x8_t __ret_388; \
  49849   uint16x8_t __s0_388 = __p0_388; /* vector argument is evaluated once into a typed local */ \
  49850   __ret_388 = splatq_laneq_u16(__s0_388, __p1_388); \
  49851   __ret_388; /* value of the statement expression */ \
  49852 })
  49853 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49854 #define vdupq_laneq_u16(__p0_389, __p1_389) __extension__ ({ \
  49855   uint16x8_t __ret_389; \
  49856   uint16x8_t __s0_389 = __p0_389; \
  49857   uint16x8_t __rev0_389;  __rev0_389 = __builtin_shufflevector(__s0_389, __s0_389, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  49858   __ret_389 = __noswap_splatq_laneq_u16(__rev0_389, __p1_389); /* lane argument is passed through unchanged */ \
  49859   __ret_389 = __builtin_shufflevector(__ret_389, __ret_389, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49860   __ret_389; \
  49861 })
  49862 #endif /* __LITTLE_ENDIAN__ */
  49863 
  49864 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_s8(v, lane): int8x16_t in, int8x16_t out; forwards to splatq_laneq_s8 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49865 #define vdupq_laneq_s8(__p0_390, __p1_390) __extension__ ({ \
  49866   int8x16_t __ret_390; \
  49867   int8x16_t __s0_390 = __p0_390; /* vector argument is evaluated once into a typed local */ \
  49868   __ret_390 = splatq_laneq_s8(__s0_390, __p1_390); \
  49869   __ret_390; /* value of the statement expression */ \
  49870 })
  49871 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49872 #define vdupq_laneq_s8(__p0_391, __p1_391) __extension__ ({ \
  49873   int8x16_t __ret_391; \
  49874   int8x16_t __s0_391 = __p0_391; \
  49875   int8x16_t __rev0_391;  __rev0_391 = __builtin_shufflevector(__s0_391, __s0_391, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the sixteen input lanes */ \
  49876   __ret_391 = __noswap_splatq_laneq_s8(__rev0_391, __p1_391); /* lane argument is passed through unchanged */ \
  49877   __ret_391 = __builtin_shufflevector(__ret_391, __ret_391, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49878   __ret_391; \
  49879 })
  49880 #endif /* __LITTLE_ENDIAN__ */
  49881 
  49882 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_f64(v, lane): float64x2_t in, float64x2_t out; forwards to splatq_laneq_f64 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49883 #define vdupq_laneq_f64(__p0_392, __p1_392) __extension__ ({ \
  49884   float64x2_t __ret_392; \
  49885   float64x2_t __s0_392 = __p0_392; /* vector argument is evaluated once into a typed local */ \
  49886   __ret_392 = splatq_laneq_f64(__s0_392, __p1_392); \
  49887   __ret_392; /* value of the statement expression */ \
  49888 })
  49889 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49890 #define vdupq_laneq_f64(__p0_393, __p1_393) __extension__ ({ \
  49891   float64x2_t __ret_393; \
  49892   float64x2_t __s0_393 = __p0_393; \
  49893   float64x2_t __rev0_393;  __rev0_393 = __builtin_shufflevector(__s0_393, __s0_393, 1, 0); /* swap the two input lanes */ \
  49894   __ret_393 = __noswap_splatq_laneq_f64(__rev0_393, __p1_393); /* lane argument is passed through unchanged */ \
  49895   __ret_393 = __builtin_shufflevector(__ret_393, __ret_393, 1, 0); /* swap the result lanes back */ \
  49896   __ret_393; \
  49897 })
  49898 #endif /* __LITTLE_ENDIAN__ */
  49899 
  49900 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_f32(v, lane): float32x4_t in, float32x4_t out; forwards to splatq_laneq_f32 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49901 #define vdupq_laneq_f32(__p0_394, __p1_394) __extension__ ({ \
  49902   float32x4_t __ret_394; \
  49903   float32x4_t __s0_394 = __p0_394; /* vector argument is evaluated once into a typed local */ \
  49904   __ret_394 = splatq_laneq_f32(__s0_394, __p1_394); \
  49905   __ret_394; /* value of the statement expression */ \
  49906 })
  49907 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49908 #define vdupq_laneq_f32(__p0_395, __p1_395) __extension__ ({ \
  49909   float32x4_t __ret_395; \
  49910   float32x4_t __s0_395 = __p0_395; \
  49911   float32x4_t __rev0_395;  __rev0_395 = __builtin_shufflevector(__s0_395, __s0_395, 3, 2, 1, 0); /* reverse the four input lanes */ \
  49912   __ret_395 = __noswap_splatq_laneq_f32(__rev0_395, __p1_395); /* lane argument is passed through unchanged */ \
  49913   __ret_395 = __builtin_shufflevector(__ret_395, __ret_395, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49914   __ret_395; \
  49915 })
  49916 #endif /* __LITTLE_ENDIAN__ */
  49917 
  49918 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_f16(v, lane): float16x8_t in, float16x8_t out; forwards to splatq_laneq_f16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49919 #define vdupq_laneq_f16(__p0_396, __p1_396) __extension__ ({ \
  49920   float16x8_t __ret_396; \
  49921   float16x8_t __s0_396 = __p0_396; /* vector argument is evaluated once into a typed local */ \
  49922   __ret_396 = splatq_laneq_f16(__s0_396, __p1_396); \
  49923   __ret_396; /* value of the statement expression */ \
  49924 })
  49925 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49926 #define vdupq_laneq_f16(__p0_397, __p1_397) __extension__ ({ \
  49927   float16x8_t __ret_397; \
  49928   float16x8_t __s0_397 = __p0_397; \
  49929   float16x8_t __rev0_397;  __rev0_397 = __builtin_shufflevector(__s0_397, __s0_397, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  49930   __ret_397 = __noswap_splatq_laneq_f16(__rev0_397, __p1_397); /* lane argument is passed through unchanged */ \
  49931   __ret_397 = __builtin_shufflevector(__ret_397, __ret_397, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49932   __ret_397; \
  49933 })
  49934 #endif /* __LITTLE_ENDIAN__ */
  49935 
  49936 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_s32(v, lane): int32x4_t in, int32x4_t out; forwards to splatq_laneq_s32 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49937 #define vdupq_laneq_s32(__p0_398, __p1_398) __extension__ ({ \
  49938   int32x4_t __ret_398; \
  49939   int32x4_t __s0_398 = __p0_398; /* vector argument is evaluated once into a typed local */ \
  49940   __ret_398 = splatq_laneq_s32(__s0_398, __p1_398); \
  49941   __ret_398; /* value of the statement expression */ \
  49942 })
  49943 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49944 #define vdupq_laneq_s32(__p0_399, __p1_399) __extension__ ({ \
  49945   int32x4_t __ret_399; \
  49946   int32x4_t __s0_399 = __p0_399; \
  49947   int32x4_t __rev0_399;  __rev0_399 = __builtin_shufflevector(__s0_399, __s0_399, 3, 2, 1, 0); /* reverse the four input lanes */ \
  49948   __ret_399 = __noswap_splatq_laneq_s32(__rev0_399, __p1_399); /* lane argument is passed through unchanged */ \
  49949   __ret_399 = __builtin_shufflevector(__ret_399, __ret_399, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49950   __ret_399; \
  49951 })
  49952 #endif /* __LITTLE_ENDIAN__ */
  49953 
  49954 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_s64(v, lane): int64x2_t in, int64x2_t out; forwards to splatq_laneq_s64 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49955 #define vdupq_laneq_s64(__p0_400, __p1_400) __extension__ ({ \
  49956   int64x2_t __ret_400; \
  49957   int64x2_t __s0_400 = __p0_400; /* vector argument is evaluated once into a typed local */ \
  49958   __ret_400 = splatq_laneq_s64(__s0_400, __p1_400); \
  49959   __ret_400; /* value of the statement expression */ \
  49960 })
  49961 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49962 #define vdupq_laneq_s64(__p0_401, __p1_401) __extension__ ({ \
  49963   int64x2_t __ret_401; \
  49964   int64x2_t __s0_401 = __p0_401; \
  49965   int64x2_t __rev0_401;  __rev0_401 = __builtin_shufflevector(__s0_401, __s0_401, 1, 0); /* swap the two input lanes */ \
  49966   __ret_401 = __noswap_splatq_laneq_s64(__rev0_401, __p1_401); /* lane argument is passed through unchanged */ \
  49967   __ret_401 = __builtin_shufflevector(__ret_401, __ret_401, 1, 0); /* swap the result lanes back */ \
  49968   __ret_401; \
  49969 })
  49970 #endif /* __LITTLE_ENDIAN__ */
  49971 
  49972 #ifdef __LITTLE_ENDIAN__ /* vdupq_laneq_s16(v, lane): int16x8_t in, int16x8_t out; forwards to splatq_laneq_s16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49973 #define vdupq_laneq_s16(__p0_402, __p1_402) __extension__ ({ \
  49974   int16x8_t __ret_402; \
  49975   int16x8_t __s0_402 = __p0_402; /* vector argument is evaluated once into a typed local */ \
  49976   __ret_402 = splatq_laneq_s16(__s0_402, __p1_402); \
  49977   __ret_402; /* value of the statement expression */ \
  49978 })
  49979 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49980 #define vdupq_laneq_s16(__p0_403, __p1_403) __extension__ ({ \
  49981   int16x8_t __ret_403; \
  49982   int16x8_t __s0_403 = __p0_403; \
  49983   int16x8_t __rev0_403;  __rev0_403 = __builtin_shufflevector(__s0_403, __s0_403, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  49984   __ret_403 = __noswap_splatq_laneq_s16(__rev0_403, __p1_403); /* lane argument is passed through unchanged */ \
  49985   __ret_403 = __builtin_shufflevector(__ret_403, __ret_403, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the result lanes back */ \
  49986   __ret_403; \
  49987 })
  49988 #endif /* __LITTLE_ENDIAN__ */
  49989 
  49990 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_u8(v, lane): uint8x16_t in, uint8x8_t out; forwards to splat_laneq_u8 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  49991 #define vdup_laneq_u8(__p0_404, __p1_404) __extension__ ({ \
  49992   uint8x8_t __ret_404; \
  49993   uint8x16_t __s0_404 = __p0_404; /* vector argument is evaluated once into a typed local */ \
  49994   __ret_404 = splat_laneq_u8(__s0_404, __p1_404); \
  49995   __ret_404; /* value of the statement expression */ \
  49996 })
  49997 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  49998 #define vdup_laneq_u8(__p0_405, __p1_405) __extension__ ({ \
  49999   uint8x8_t __ret_405; \
  50000   uint8x16_t __s0_405 = __p0_405; \
  50001   uint8x16_t __rev0_405;  __rev0_405 = __builtin_shufflevector(__s0_405, __s0_405, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the sixteen input lanes */ \
  50002   __ret_405 = __noswap_splat_laneq_u8(__rev0_405, __p1_405); /* lane argument is passed through unchanged */ \
  50003   __ret_405 = __builtin_shufflevector(__ret_405, __ret_405, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight result lanes back */ \
  50004   __ret_405; \
  50005 })
  50006 #endif /* __LITTLE_ENDIAN__ */
  50007 
  50008 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_u32(v, lane): uint32x4_t in, uint32x2_t out; forwards to splat_laneq_u32 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50009 #define vdup_laneq_u32(__p0_406, __p1_406) __extension__ ({ \
  50010   uint32x2_t __ret_406; \
  50011   uint32x4_t __s0_406 = __p0_406; /* vector argument is evaluated once into a typed local */ \
  50012   __ret_406 = splat_laneq_u32(__s0_406, __p1_406); \
  50013   __ret_406; /* value of the statement expression */ \
  50014 })
  50015 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50016 #define vdup_laneq_u32(__p0_407, __p1_407) __extension__ ({ \
  50017   uint32x2_t __ret_407; \
  50018   uint32x4_t __s0_407 = __p0_407; \
  50019   uint32x4_t __rev0_407;  __rev0_407 = __builtin_shufflevector(__s0_407, __s0_407, 3, 2, 1, 0); /* reverse the four input lanes */ \
  50020   __ret_407 = __noswap_splat_laneq_u32(__rev0_407, __p1_407); /* lane argument is passed through unchanged */ \
  50021   __ret_407 = __builtin_shufflevector(__ret_407, __ret_407, 1, 0); /* swap the two result lanes back */ \
  50022   __ret_407; \
  50023 })
  50024 #endif /* __LITTLE_ENDIAN__ */
  50025 
  50026 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_u64(v, lane): uint64x2_t in, uint64x1_t out; forwards to splat_laneq_u64 (defined elsewhere; presumably selects lane `lane` - confirm) */
  50027 #define vdup_laneq_u64(__p0_408, __p1_408) __extension__ ({ \
  50028   uint64x1_t __ret_408; \
  50029   uint64x2_t __s0_408 = __p0_408; /* vector argument is evaluated once into a typed local */ \
  50030   __ret_408 = splat_laneq_u64(__s0_408, __p1_408); \
  50031   __ret_408; /* value of the statement expression */ \
  50032 })
  50033 #else /* not little-endian: only the input is lane-reversed; the one-lane result is returned as is */
  50034 #define vdup_laneq_u64(__p0_409, __p1_409) __extension__ ({ \
  50035   uint64x1_t __ret_409; \
  50036   uint64x2_t __s0_409 = __p0_409; \
  50037   uint64x2_t __rev0_409;  __rev0_409 = __builtin_shufflevector(__s0_409, __s0_409, 1, 0); /* swap the two input lanes */ \
  50038   __ret_409 = __noswap_splat_laneq_u64(__rev0_409, __p1_409); /* lane argument is passed through unchanged */ \
  50039   __ret_409; /* single-lane result: no shuffle applied */ \
  50040 })
  50041 #endif /* __LITTLE_ENDIAN__ */
  50042 
  50043 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_u16(v, lane): uint16x8_t in, uint16x4_t out; forwards to splat_laneq_u16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50044 #define vdup_laneq_u16(__p0_410, __p1_410) __extension__ ({ \
  50045   uint16x4_t __ret_410; \
  50046   uint16x8_t __s0_410 = __p0_410; /* vector argument is evaluated once into a typed local */ \
  50047   __ret_410 = splat_laneq_u16(__s0_410, __p1_410); \
  50048   __ret_410; /* value of the statement expression */ \
  50049 })
  50050 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50051 #define vdup_laneq_u16(__p0_411, __p1_411) __extension__ ({ \
  50052   uint16x4_t __ret_411; \
  50053   uint16x8_t __s0_411 = __p0_411; \
  50054   uint16x8_t __rev0_411;  __rev0_411 = __builtin_shufflevector(__s0_411, __s0_411, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  50055   __ret_411 = __noswap_splat_laneq_u16(__rev0_411, __p1_411); /* lane argument is passed through unchanged */ \
  50056   __ret_411 = __builtin_shufflevector(__ret_411, __ret_411, 3, 2, 1, 0); /* reverse the four result lanes back */ \
  50057   __ret_411; \
  50058 })
  50059 #endif /* __LITTLE_ENDIAN__ */
  50060 
  50061 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_s8(v, lane): int8x16_t in, int8x8_t out; forwards to splat_laneq_s8 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50062 #define vdup_laneq_s8(__p0_412, __p1_412) __extension__ ({ \
  50063   int8x8_t __ret_412; \
  50064   int8x16_t __s0_412 = __p0_412; /* vector argument is evaluated once into a typed local */ \
  50065   __ret_412 = splat_laneq_s8(__s0_412, __p1_412); \
  50066   __ret_412; /* value of the statement expression */ \
  50067 })
  50068 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50069 #define vdup_laneq_s8(__p0_413, __p1_413) __extension__ ({ \
  50070   int8x8_t __ret_413; \
  50071   int8x16_t __s0_413 = __p0_413; \
  50072   int8x16_t __rev0_413;  __rev0_413 = __builtin_shufflevector(__s0_413, __s0_413, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the sixteen input lanes */ \
  50073   __ret_413 = __noswap_splat_laneq_s8(__rev0_413, __p1_413); /* lane argument is passed through unchanged */ \
  50074   __ret_413 = __builtin_shufflevector(__ret_413, __ret_413, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight result lanes back */ \
  50075   __ret_413; \
  50076 })
  50077 #endif /* __LITTLE_ENDIAN__ */
  50078 
  50079 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_f64(v, lane): float64x2_t in, float64x1_t out; forwards to splat_laneq_f64 (defined elsewhere; presumably selects lane `lane` - confirm) */
  50080 #define vdup_laneq_f64(__p0_414, __p1_414) __extension__ ({ \
  50081   float64x1_t __ret_414; \
  50082   float64x2_t __s0_414 = __p0_414; /* vector argument is evaluated once into a typed local */ \
  50083   __ret_414 = splat_laneq_f64(__s0_414, __p1_414); \
  50084   __ret_414; /* value of the statement expression */ \
  50085 })
  50086 #else /* not little-endian: only the input is lane-reversed; the one-lane result is returned as is */
  50087 #define vdup_laneq_f64(__p0_415, __p1_415) __extension__ ({ \
  50088   float64x1_t __ret_415; \
  50089   float64x2_t __s0_415 = __p0_415; \
  50090   float64x2_t __rev0_415;  __rev0_415 = __builtin_shufflevector(__s0_415, __s0_415, 1, 0); /* swap the two input lanes */ \
  50091   __ret_415 = __noswap_splat_laneq_f64(__rev0_415, __p1_415); /* lane argument is passed through unchanged */ \
  50092   __ret_415; /* single-lane result: no shuffle applied */ \
  50093 })
  50094 #endif /* __LITTLE_ENDIAN__ */
  50095 
  50096 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_f32(v, lane): float32x4_t in, float32x2_t out; forwards to splat_laneq_f32 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50097 #define vdup_laneq_f32(__p0_416, __p1_416) __extension__ ({ \
  50098   float32x2_t __ret_416; \
  50099   float32x4_t __s0_416 = __p0_416; /* vector argument is evaluated once into a typed local */ \
  50100   __ret_416 = splat_laneq_f32(__s0_416, __p1_416); \
  50101   __ret_416; /* value of the statement expression */ \
  50102 })
  50103 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50104 #define vdup_laneq_f32(__p0_417, __p1_417) __extension__ ({ \
  50105   float32x2_t __ret_417; \
  50106   float32x4_t __s0_417 = __p0_417; \
  50107   float32x4_t __rev0_417;  __rev0_417 = __builtin_shufflevector(__s0_417, __s0_417, 3, 2, 1, 0); /* reverse the four input lanes */ \
  50108   __ret_417 = __noswap_splat_laneq_f32(__rev0_417, __p1_417); /* lane argument is passed through unchanged */ \
  50109   __ret_417 = __builtin_shufflevector(__ret_417, __ret_417, 1, 0); /* swap the two result lanes back */ \
  50110   __ret_417; \
  50111 })
  50112 #endif /* __LITTLE_ENDIAN__ */
  50113 
  50114 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_f16(v, lane): float16x8_t in, float16x4_t out; forwards to splat_laneq_f16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50115 #define vdup_laneq_f16(__p0_418, __p1_418) __extension__ ({ \
  50116   float16x4_t __ret_418; \
  50117   float16x8_t __s0_418 = __p0_418; /* vector argument is evaluated once into a typed local */ \
  50118   __ret_418 = splat_laneq_f16(__s0_418, __p1_418); \
  50119   __ret_418; /* value of the statement expression */ \
  50120 })
  50121 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50122 #define vdup_laneq_f16(__p0_419, __p1_419) __extension__ ({ \
  50123   float16x4_t __ret_419; \
  50124   float16x8_t __s0_419 = __p0_419; \
  50125   float16x8_t __rev0_419;  __rev0_419 = __builtin_shufflevector(__s0_419, __s0_419, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  50126   __ret_419 = __noswap_splat_laneq_f16(__rev0_419, __p1_419); /* lane argument is passed through unchanged */ \
  50127   __ret_419 = __builtin_shufflevector(__ret_419, __ret_419, 3, 2, 1, 0); /* reverse the four result lanes back */ \
  50128   __ret_419; \
  50129 })
  50130 #endif /* __LITTLE_ENDIAN__ */
  50131 
  50132 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_s32(v, lane): int32x4_t in, int32x2_t out; forwards to splat_laneq_s32 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50133 #define vdup_laneq_s32(__p0_420, __p1_420) __extension__ ({ \
  50134   int32x2_t __ret_420; \
  50135   int32x4_t __s0_420 = __p0_420; /* vector argument is evaluated once into a typed local */ \
  50136   __ret_420 = splat_laneq_s32(__s0_420, __p1_420); \
  50137   __ret_420; /* value of the statement expression */ \
  50138 })
  50139 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50140 #define vdup_laneq_s32(__p0_421, __p1_421) __extension__ ({ \
  50141   int32x2_t __ret_421; \
  50142   int32x4_t __s0_421 = __p0_421; \
  50143   int32x4_t __rev0_421;  __rev0_421 = __builtin_shufflevector(__s0_421, __s0_421, 3, 2, 1, 0); /* reverse the four input lanes */ \
  50144   __ret_421 = __noswap_splat_laneq_s32(__rev0_421, __p1_421); /* lane argument is passed through unchanged */ \
  50145   __ret_421 = __builtin_shufflevector(__ret_421, __ret_421, 1, 0); /* swap the two result lanes back */ \
  50146   __ret_421; \
  50147 })
  50148 #endif /* __LITTLE_ENDIAN__ */
  50149 
  50150 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_s64(v, lane): int64x2_t in, int64x1_t out; forwards to splat_laneq_s64 (defined elsewhere; presumably selects lane `lane` - confirm) */
  50151 #define vdup_laneq_s64(__p0_422, __p1_422) __extension__ ({ \
  50152   int64x1_t __ret_422; \
  50153   int64x2_t __s0_422 = __p0_422; /* vector argument is evaluated once into a typed local */ \
  50154   __ret_422 = splat_laneq_s64(__s0_422, __p1_422); \
  50155   __ret_422; /* value of the statement expression */ \
  50156 })
  50157 #else /* not little-endian: only the input is lane-reversed; the one-lane result is returned as is */
  50158 #define vdup_laneq_s64(__p0_423, __p1_423) __extension__ ({ \
  50159   int64x1_t __ret_423; \
  50160   int64x2_t __s0_423 = __p0_423; \
  50161   int64x2_t __rev0_423;  __rev0_423 = __builtin_shufflevector(__s0_423, __s0_423, 1, 0); /* swap the two input lanes */ \
  50162   __ret_423 = __noswap_splat_laneq_s64(__rev0_423, __p1_423); /* lane argument is passed through unchanged */ \
  50163   __ret_423; /* single-lane result: no shuffle applied */ \
  50164 })
  50165 #endif /* __LITTLE_ENDIAN__ */
  50166 
  50167 #ifdef __LITTLE_ENDIAN__ /* vdup_laneq_s16(v, lane): int16x8_t in, int16x4_t out; forwards to splat_laneq_s16 (defined elsewhere; presumably broadcasts lane `lane` - confirm) */
  50168 #define vdup_laneq_s16(__p0_424, __p1_424) __extension__ ({ \
  50169   int16x4_t __ret_424; \
  50170   int16x8_t __s0_424 = __p0_424; /* vector argument is evaluated once into a typed local */ \
  50171   __ret_424 = splat_laneq_s16(__s0_424, __p1_424); \
  50172   __ret_424; /* value of the statement expression */ \
  50173 })
  50174 #else /* not little-endian: reverse lanes, call the __noswap_ helper, reverse the result */
  50175 #define vdup_laneq_s16(__p0_425, __p1_425) __extension__ ({ \
  50176   int16x4_t __ret_425; \
  50177   int16x8_t __s0_425 = __p0_425; \
  50178   int16x8_t __rev0_425;  __rev0_425 = __builtin_shufflevector(__s0_425, __s0_425, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the eight input lanes */ \
  50179   __ret_425 = __noswap_splat_laneq_s16(__rev0_425, __p1_425); /* lane argument is passed through unchanged */ \
  50180   __ret_425 = __builtin_shufflevector(__ret_425, __ret_425, 3, 2, 1, 0); /* reverse the four result lanes back */ \
  50181   __ret_425; \
  50182 })
  50183 #endif /* __LITTLE_ENDIAN__ */
  50184 
  50185 __ai __attribute__((target("neon"))) poly64x1_t vdup_n_p64(poly64_t __p0) { /* Returns a one-lane poly64x1_t whose only element is __p0. */
  50186   poly64x1_t __ret;
  50187   __ret = (poly64x1_t) {__p0}; /* vector literal with a single element */
  50188   return __ret;
  50189 }
  50190 #ifdef __LITTLE_ENDIAN__ /* vdupq_n_p64: returns a poly64x2_t with both lanes set to the scalar __p0 */
  50191 __ai __attribute__((target("neon"))) poly64x2_t vdupq_n_p64(poly64_t __p0) {
  50192   poly64x2_t __ret;
  50193   __ret = (poly64x2_t) {__p0, __p0}; /* same scalar in lane 0 and lane 1 */
  50194   return __ret;
  50195 }
  50196 #else /* not little-endian: same construction followed by a lane swap */
  50197 __ai __attribute__((target("neon"))) poly64x2_t vdupq_n_p64(poly64_t __p0) {
  50198   poly64x2_t __ret;
  50199   __ret = (poly64x2_t) {__p0, __p0};
  50200   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swaps two equal lanes, so the value is unchanged; presumably kept for the generator's uniform big-endian pattern */
  50201   return __ret;
  50202 }
  50203 #endif /* __LITTLE_ENDIAN__ */
  50204 
  50205 #ifdef __LITTLE_ENDIAN__ /* vdupq_n_f64: returns a float64x2_t with both lanes set to the scalar __p0 */
  50206 __ai __attribute__((target("neon"))) float64x2_t vdupq_n_f64(float64_t __p0) {
  50207   float64x2_t __ret;
  50208   __ret = (float64x2_t) {__p0, __p0}; /* same scalar in lane 0 and lane 1 */
  50209   return __ret;
  50210 }
  50211 #else /* not little-endian: same construction followed by a lane swap */
  50212 __ai __attribute__((target("neon"))) float64x2_t vdupq_n_f64(float64_t __p0) {
  50213   float64x2_t __ret;
  50214   __ret = (float64x2_t) {__p0, __p0};
  50215   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swaps two equal lanes, so the value is unchanged; presumably kept for the generator's uniform big-endian pattern */
  50216   return __ret;
  50217 }
  50218 #endif /* __LITTLE_ENDIAN__ */
  50219 
  50220 __ai __attribute__((target("neon"))) float64x1_t vdup_n_f64(float64_t __p0) { /* Returns a one-lane float64x1_t whose only element is __p0. */
  50221   float64x1_t __ret;
  50222   __ret = (float64x1_t) {__p0}; /* vector literal with a single element */
  50223   return __ret;
  50224 }
  50225 #define vext_p64(__p0, __p1, __p2) __extension__ ({ /* vext_p64(a, b, n): passes two poly64x1_t operands and n to __builtin_neon_vext_v; yields poly64x1_t. No endian-specific variant. */ \
  50226   poly64x1_t __ret; \
  50227   poly64x1_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50228   poly64x1_t __s1 = __p1; \
  50229   __ret = (poly64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); /* operands are cast to int8x8_t for the generic builtin; trailing 6 is presumably its type code for poly64x1_t - confirm */ \
  50230   __ret; /* value of the statement expression */ \
  50231 })
  50232 #ifdef __LITTLE_ENDIAN__ /* vextq_p64(a, b, n): passes two poly64x2_t operands and n to __builtin_neon_vextq_v; yields poly64x2_t */
  50233 #define vextq_p64(__p0, __p1, __p2) __extension__ ({ \
  50234   poly64x2_t __ret; \
  50235   poly64x2_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50236   poly64x2_t __s1 = __p1; \
  50237   __ret = (poly64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); /* operands cast to int8x16_t for the generic builtin; trailing 38 is presumably its type code for poly64x2_t - confirm */ \
  50238   __ret; /* value of the statement expression */ \
  50239 })
  50240 #else /* not little-endian: both operands are lane-swapped before the builtin and the result is swapped back */
  50241 #define vextq_p64(__p0, __p1, __p2) __extension__ ({ \
  50242   poly64x2_t __ret; \
  50243   poly64x2_t __s0 = __p0; \
  50244   poly64x2_t __s1 = __p1; \
  50245   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); /* swap lanes of the first operand */ \
  50246   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); /* swap lanes of the second operand */ \
  50247   __ret = (poly64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); /* n is passed through unchanged */ \
  50248   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */ \
  50249   __ret; \
  50250 })
  50251 #endif /* __LITTLE_ENDIAN__ */
  50252 
  50253 #ifdef __LITTLE_ENDIAN__ /* vextq_f64(a, b, n): passes two float64x2_t operands and n to __builtin_neon_vextq_v; yields float64x2_t */
  50254 #define vextq_f64(__p0, __p1, __p2) __extension__ ({ \
  50255   float64x2_t __ret; \
  50256   float64x2_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50257   float64x2_t __s1 = __p1; \
  50258   __ret = (float64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 42); /* operands cast to int8x16_t for the generic builtin; trailing 42 is presumably its type code for float64x2_t - confirm */ \
  50259   __ret; /* value of the statement expression */ \
  50260 })
  50261 #else /* not little-endian: both operands are lane-swapped before the builtin and the result is swapped back */
  50262 #define vextq_f64(__p0, __p1, __p2) __extension__ ({ \
  50263   float64x2_t __ret; \
  50264   float64x2_t __s0 = __p0; \
  50265   float64x2_t __s1 = __p1; \
  50266   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); /* swap lanes of the first operand */ \
  50267   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); /* swap lanes of the second operand */ \
  50268   __ret = (float64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 42); /* n is passed through unchanged */ \
  50269   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */ \
  50270   __ret; \
  50271 })
  50272 #endif /* __LITTLE_ENDIAN__ */
  50273 
  50274 #define vext_f64(__p0, __p1, __p2) __extension__ ({ /* vext_f64(a, b, n): passes two float64x1_t operands and n to __builtin_neon_vext_v; yields float64x1_t. No endian-specific variant. */ \
  50275   float64x1_t __ret; \
  50276   float64x1_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50277   float64x1_t __s1 = __p1; \
  50278   __ret = (float64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 10); /* operands are cast to int8x8_t for the generic builtin; trailing 10 is presumably its type code for float64x1_t - confirm */ \
  50279   __ret; /* value of the statement expression */ \
  50280 })
  50281 #ifdef __LITTLE_ENDIAN__ /* vfmaq_f64: passes three float64x2_t operands to __builtin_neon_vfmaq_v and returns its float64x2_t result (by name a fused multiply-add, presumably __p0 + __p1 * __p2 - confirm against ACLE) */
  50282 __ai __attribute__((target("neon"))) float64x2_t vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  50283   float64x2_t __ret;
  50284   __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); /* operands cast to int8x16_t for the generic builtin; trailing 42 is presumably its type code for float64x2_t - confirm */
  50285   return __ret;
  50286 }
  50287 #else /* not little-endian: lane-swapping public wrapper plus a __noswap_ variant that applies no swaps */
  50288 __ai __attribute__((target("neon"))) float64x2_t vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  50289   float64x2_t __ret;
  50290   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); /* swap the lanes of each operand */
  50291   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  50292   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  50293   __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  50294   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */
  50295   return __ret;
  50296 }
  50297 __ai __attribute__((target("neon"))) float64x2_t __noswap_vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { /* same builtin call without any lane swaps; presumably for callers whose operands are already swapped */
  50298   float64x2_t __ret;
  50299   __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  50300   return __ret;
  50301 }
  50302 #endif /* __LITTLE_ENDIAN__ */
  50303 
  50304 __ai __attribute__((target("neon"))) float64x1_t vfma_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { /* Passes three float64x1_t operands to __builtin_neon_vfma_v and returns its float64x1_t result (by name a fused multiply-add - confirm against ACLE). */
  50305   float64x1_t __ret;
  50306   __ret = (float64x1_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 10); /* operands cast to int8x8_t for the generic builtin; trailing 10 is presumably its type code for float64x1_t - confirm */
  50307   return __ret;
  50308 }
  50309 #define vfmad_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* vfmad_lane_f64(a, b, v, lane): float64_t a and b, float64x1_t v; yields the float64_t result of __builtin_neon_vfmad_lane_f64. No endian-specific variant. */ \
  50310   float64_t __ret; \
  50311   float64_t __s0 = __p0; /* each value argument is evaluated once into a typed local */ \
  50312   float64_t __s1 = __p1; \
  50313   float64x1_t __s2 = __p2; \
  50314   __ret = (float64_t) __builtin_neon_vfmad_lane_f64(__s0, __s1, (float64x1_t)__s2, __p3); /* fourth argument is passed through unchanged */ \
  50315   __ret; /* value of the statement expression */ \
  50316 })
  50317 #ifdef __LITTLE_ENDIAN__ /* vfmas_lane_f32(a, b, v, lane): float32_t a and b, float32x2_t v; yields the float32_t result of __builtin_neon_vfmas_lane_f32 */
  50318 #define vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50319   float32_t __ret; \
  50320   float32_t __s0 = __p0; /* each value argument is evaluated once into a typed local */ \
  50321   float32_t __s1 = __p1; \
  50322   float32x2_t __s2 = __p2; \
  50323   __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__s2, __p3); /* fourth argument is passed through unchanged */ \
  50324   __ret; /* value of the statement expression */ \
  50325 })
  50326 #else /* not little-endian: the vector operand is lane-swapped first; the scalar result needs no shuffle */
  50327 #define vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50328   float32_t __ret; \
  50329   float32_t __s0 = __p0; \
  50330   float32_t __s1 = __p1; \
  50331   float32x2_t __s2 = __p2; \
  50332   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); /* swap the two lanes of the vector operand */ \
  50333   __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__rev2, __p3); \
  50334   __ret; \
  50335 })
  50336 #define __noswap_vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without the lane swap; presumably for callers whose vector operand is already swapped */ \
  50337   float32_t __ret; \
  50338   float32_t __s0 = __p0; \
  50339   float32_t __s1 = __p1; \
  50340   float32x2_t __s2 = __p2; \
  50341   __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__s2, __p3); \
  50342   __ret; \
  50343 })
  50344 #endif /* __LITTLE_ENDIAN__ */
  50345 
  50346 #ifdef __LITTLE_ENDIAN__ /* vfmaq_lane_f64(a, b, v, lane): float64x2_t a and b, float64x1_t v; yields the float64x2_t result of __builtin_neon_vfmaq_lane_v */
  50347 #define vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50348   float64x2_t __ret; \
  50349   float64x2_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50350   float64x2_t __s1 = __p1; \
  50351   float64x1_t __s2 = __p2; \
  50352   __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 42); /* trailing 42 is presumably the builtin's type code for float64x2_t - confirm */ \
  50353   __ret; /* value of the statement expression */ \
  50354 })
  50355 #else /* not little-endian: a and b are lane-swapped, the one-lane v is used as is, and the result is swapped back */
  50356 #define vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50357   float64x2_t __ret; \
  50358   float64x2_t __s0 = __p0; \
  50359   float64x2_t __s1 = __p1; \
  50360   float64x1_t __s2 = __p2; \
  50361   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); /* swap lanes of the first operand */ \
  50362   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); /* swap lanes of the second operand */ \
  50363   __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__s2, __p3, 42); /* __s2 has a single lane, so no swapped copy is made */ \
  50364   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */ \
  50365   __ret; \
  50366 })
  50367 #define __noswap_vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without any lane swaps; presumably for callers whose operands are already swapped */ \
  50368   float64x2_t __ret; \
  50369   float64x2_t __s0 = __p0; \
  50370   float64x2_t __s1 = __p1; \
  50371   float64x1_t __s2 = __p2; \
  50372   __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 42); \
  50373   __ret; \
  50374 })
  50375 #endif /* __LITTLE_ENDIAN__ */
  50376 
  50377 #ifdef __LITTLE_ENDIAN__ /* vfmaq_lane_f32(a, b, v, lane): float32x4_t a and b, float32x2_t v; yields the float32x4_t result of __builtin_neon_vfmaq_lane_v */
  50378 #define vfmaq_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50379   float32x4_t __ret; \
  50380   float32x4_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50381   float32x4_t __s1 = __p1; \
  50382   float32x2_t __s2 = __p2; \
  50383   __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 41); /* trailing 41 is presumably the builtin's type code for float32x4_t - confirm */ \
  50384   __ret; /* value of the statement expression */ \
  50385 })
  50386 #else /* not little-endian: all three vector operands are lane-reversed and the result is reversed back */
  50387 #define vfmaq_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50388   float32x4_t __ret; \
  50389   float32x4_t __s0 = __p0; \
  50390   float32x4_t __s1 = __p1; \
  50391   float32x2_t __s2 = __p2; \
  50392   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); /* reverse the four lanes of the first operand */ \
  50393   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); /* reverse the four lanes of the second operand */ \
  50394   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); /* swap the two lanes of the third operand */ \
  50395   __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, __p3, 41); /* lane argument is passed through unchanged */ \
  50396   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); /* reverse the result lanes back */ \
  50397   __ret; \
  50398 })
  50399 #define __noswap_vfmaq_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without any lane reversal; presumably for callers whose operands are already reversed */ \
  50400   float32x4_t __ret; \
  50401   float32x4_t __s0 = __p0; \
  50402   float32x4_t __s1 = __p1; \
  50403   float32x2_t __s2 = __p2; \
  50404   __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 41); \
  50405   __ret; \
  50406 })
  50407 #endif /* __LITTLE_ENDIAN__ */
  50408 
  50409 #define vfma_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* vfma_lane_f64(a, b, v, lane): three float64x1_t operands; yields the float64x1_t result of __builtin_neon_vfma_lane_v. No endian-specific variant. */ \
  50410   float64x1_t __ret; \
  50411   float64x1_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50412   float64x1_t __s1 = __p1; \
  50413   float64x1_t __s2 = __p2; \
  50414   __ret = (float64x1_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 10); /* trailing 10 is presumably the builtin's type code for float64x1_t - confirm */ \
  50415   __ret; /* value of the statement expression */ \
  50416 })
  50417 #ifdef __LITTLE_ENDIAN__ /* vfma_lane_f32(a, b, v, lane): three float32x2_t operands; yields the float32x2_t result of __builtin_neon_vfma_lane_v */
  50418 #define vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50419   float32x2_t __ret; \
  50420   float32x2_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50421   float32x2_t __s1 = __p1; \
  50422   float32x2_t __s2 = __p2; \
  50423   __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 9); /* trailing 9 is presumably the builtin's type code for float32x2_t - confirm */ \
  50424   __ret; /* value of the statement expression */ \
  50425 })
  50426 #else /* not little-endian: all three operands are lane-swapped and the result is swapped back */
  50427 #define vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50428   float32x2_t __ret; \
  50429   float32x2_t __s0 = __p0; \
  50430   float32x2_t __s1 = __p1; \
  50431   float32x2_t __s2 = __p2; \
  50432   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); /* swap the lanes of each operand */ \
  50433   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  50434   float32x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \
  50435   __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, __p3, 9); /* lane argument is passed through unchanged */ \
  50436   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */ \
  50437   __ret; \
  50438 })
  50439 #define __noswap_vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without any lane swaps; presumably for callers whose operands are already swapped */ \
  50440   float32x2_t __ret; \
  50441   float32x2_t __s0 = __p0; \
  50442   float32x2_t __s1 = __p1; \
  50443   float32x2_t __s2 = __p2; \
  50444   __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 9); \
  50445   __ret; \
  50446 })
  50447 #endif /* __LITTLE_ENDIAN__ */
  50448 
  50449 #ifdef __LITTLE_ENDIAN__ /* vfmad_laneq_f64(a, b, v, lane): float64_t a and b, float64x2_t v; yields the float64_t result of __builtin_neon_vfmad_laneq_f64 */
  50450 #define vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50451   float64_t __ret; \
  50452   float64_t __s0 = __p0; /* each value argument is evaluated once into a typed local */ \
  50453   float64_t __s1 = __p1; \
  50454   float64x2_t __s2 = __p2; \
  50455   __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__s2, __p3); /* fourth argument is passed through unchanged */ \
  50456   __ret; /* value of the statement expression */ \
  50457 })
  50458 #else /* not little-endian: the vector operand is lane-swapped first; the scalar result needs no shuffle */
  50459 #define vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50460   float64_t __ret; \
  50461   float64_t __s0 = __p0; \
  50462   float64_t __s1 = __p1; \
  50463   float64x2_t __s2 = __p2; \
  50464   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); /* swap the two lanes of the vector operand */ \
  50465   __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__rev2, __p3); \
  50466   __ret; \
  50467 })
  50468 #define __noswap_vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without the lane swap; presumably for callers whose vector operand is already swapped */ \
  50469   float64_t __ret; \
  50470   float64_t __s0 = __p0; \
  50471   float64_t __s1 = __p1; \
  50472   float64x2_t __s2 = __p2; \
  50473   __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__s2, __p3); \
  50474   __ret; \
  50475 })
  50476 #endif /* __LITTLE_ENDIAN__ */
  50477 
  50478 #ifdef __LITTLE_ENDIAN__ /* vfmas_laneq_f32(a, b, v, lane): float32_t a and b, float32x4_t v; yields the float32_t result of __builtin_neon_vfmas_laneq_f32 */
  50479 #define vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50480   float32_t __ret; \
  50481   float32_t __s0 = __p0; /* each value argument is evaluated once into a typed local */ \
  50482   float32_t __s1 = __p1; \
  50483   float32x4_t __s2 = __p2; \
  50484   __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__s2, __p3); /* fourth argument is passed through unchanged */ \
  50485   __ret; /* value of the statement expression */ \
  50486 })
  50487 #else /* not little-endian: the vector operand is lane-reversed first; the scalar result needs no shuffle */
  50488 #define vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50489   float32_t __ret; \
  50490   float32_t __s0 = __p0; \
  50491   float32_t __s1 = __p1; \
  50492   float32x4_t __s2 = __p2; \
  50493   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); /* reverse the four lanes of the vector operand */ \
  50494   __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__rev2, __p3); \
  50495   __ret; \
  50496 })
  50497 #define __noswap_vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without the lane reversal; presumably for callers whose vector operand is already reversed */ \
  50498   float32_t __ret; \
  50499   float32_t __s0 = __p0; \
  50500   float32_t __s1 = __p1; \
  50501   float32x4_t __s2 = __p2; \
  50502   __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__s2, __p3); \
  50503   __ret; \
  50504 })
  50505 #endif /* __LITTLE_ENDIAN__ */
  50506 
  50507 #ifdef __LITTLE_ENDIAN__ /* vfmaq_laneq_f64(a, b, v, lane): three float64x2_t operands; yields the float64x2_t result of __builtin_neon_vfmaq_laneq_v */
  50508 #define vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50509   float64x2_t __ret; \
  50510   float64x2_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50511   float64x2_t __s1 = __p1; \
  50512   float64x2_t __s2 = __p2; \
  50513   __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 42); /* trailing 42 is presumably the builtin's type code for float64x2_t - confirm */ \
  50514   __ret; /* value of the statement expression */ \
  50515 })
  50516 #else /* not little-endian: all three operands are lane-swapped and the result is swapped back */
  50517 #define vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50518   float64x2_t __ret; \
  50519   float64x2_t __s0 = __p0; \
  50520   float64x2_t __s1 = __p1; \
  50521   float64x2_t __s2 = __p2; \
  50522   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); /* swap the lanes of each operand */ \
  50523   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  50524   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \
  50525   __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 42); /* lane argument is passed through unchanged */ \
  50526   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); /* swap the result lanes back */ \
  50527   __ret; \
  50528 })
  50529 #define __noswap_vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without any lane swaps; presumably for callers whose operands are already swapped */ \
  50530   float64x2_t __ret; \
  50531   float64x2_t __s0 = __p0; \
  50532   float64x2_t __s1 = __p1; \
  50533   float64x2_t __s2 = __p2; \
  50534   __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 42); \
  50535   __ret; \
  50536 })
  50537 #endif /* __LITTLE_ENDIAN__ */
  50538 
  50539 #ifdef __LITTLE_ENDIAN__ /* vfmaq_laneq_f32(a, b, v, lane): three float32x4_t operands; yields the float32x4_t result of __builtin_neon_vfmaq_laneq_v */
  50540 #define vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50541   float32x4_t __ret; \
  50542   float32x4_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50543   float32x4_t __s1 = __p1; \
  50544   float32x4_t __s2 = __p2; \
  50545   __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 41); /* trailing 41 is presumably the builtin's type code for float32x4_t - confirm */ \
  50546   __ret; /* value of the statement expression */ \
  50547 })
  50548 #else /* not little-endian: all three operands are lane-reversed and the result is reversed back */
  50549 #define vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50550   float32x4_t __ret; \
  50551   float32x4_t __s0 = __p0; \
  50552   float32x4_t __s1 = __p1; \
  50553   float32x4_t __s2 = __p2; \
  50554   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); /* reverse the four lanes of each operand */ \
  50555   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  50556   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  50557   __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 41); /* lane argument is passed through unchanged */ \
  50558   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); /* reverse the result lanes back */ \
  50559   __ret; \
  50560 })
  50561 #define __noswap_vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without any lane reversal; presumably for callers whose operands are already reversed */ \
  50562   float32x4_t __ret; \
  50563   float32x4_t __s0 = __p0; \
  50564   float32x4_t __s1 = __p1; \
  50565   float32x4_t __s2 = __p2; \
  50566   __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 41); \
  50567   __ret; \
  50568 })
  50569 #endif /* __LITTLE_ENDIAN__ */
  50570 
  50571 #ifdef __LITTLE_ENDIAN__ /* vfma_laneq_f64(a, b, v, lane): float64x1_t a and b, float64x2_t v; yields the float64x1_t result of __builtin_neon_vfma_laneq_v */
  50572 #define vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50573   float64x1_t __ret; \
  50574   float64x1_t __s0 = __p0; /* each vector argument is evaluated once into a typed local */ \
  50575   float64x1_t __s1 = __p1; \
  50576   float64x2_t __s2 = __p2; \
  50577   __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 10); /* trailing 10 is presumably the builtin's type code for float64x1_t - confirm */ \
  50578   __ret; /* value of the statement expression */ \
  50579 })
  50580 #else /* not little-endian: only the two-lane v is swapped; the one-lane a, b and result are used as is */
  50581 #define vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \
  50582   float64x1_t __ret; \
  50583   float64x1_t __s0 = __p0; \
  50584   float64x1_t __s1 = __p1; \
  50585   float64x2_t __s2 = __p2; \
  50586   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); /* swap the two lanes of the third operand */ \
  50587   __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__rev2, __p3, 10); /* lane argument is passed through unchanged */ \
  50588   __ret; /* single-lane result: no shuffle applied */ \
  50589 })
  50590 #define __noswap_vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ /* same call without the lane swap; presumably for callers whose vector operand is already swapped */ \
  50591   float64x1_t __ret; \
  50592   float64x1_t __s0 = __p0; \
  50593   float64x1_t __s1 = __p1; \
  50594   float64x2_t __s2 = __p2; \
  50595   __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 10); \
  50596   __ret; \
  50597 })
  50598 #endif /* __LITTLE_ENDIAN__ */
  50599 
  50600 #ifdef __LITTLE_ENDIAN__
  50601 #define vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50602   float32x2_t __ret; \
  50603   float32x2_t __s0 = __p0; \
  50604   float32x2_t __s1 = __p1; \
  50605   float32x4_t __s2 = __p2; \
  50606   __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 9); \
  50607   __ret; \
  50608 })
  50609 #else
  50610 #define vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50611   float32x2_t __ret; \
  50612   float32x2_t __s0 = __p0; \
  50613   float32x2_t __s1 = __p1; \
  50614   float32x4_t __s2 = __p2; \
  50615   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  50616   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  50617   float32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  50618   __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x16_t)__rev2, __p3, 9); \
  50619   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  50620   __ret; \
  50621 })
  50622 #define __noswap_vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \
  50623   float32x2_t __ret; \
  50624   float32x2_t __s0 = __p0; \
  50625   float32x2_t __s1 = __p1; \
  50626   float32x4_t __s2 = __p2; \
  50627   __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 9); \
  50628   __ret; \
  50629 })
  50630 #endif
  50631 
  50632 #ifdef __LITTLE_ENDIAN__
  50633 __ai __attribute__((target("neon"))) float64x2_t vfmaq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) {
  50634   float64x2_t __ret;
  50635   __ret = vfmaq_f64(__p0, __p1, (float64x2_t) {__p2, __p2});
  50636   return __ret;
  50637 }
  50638 #else
  50639 __ai __attribute__((target("neon"))) float64x2_t vfmaq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) {
  50640   float64x2_t __ret;
  50641   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  50642   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  50643   __ret = __noswap_vfmaq_f64(__rev0, __rev1, (float64x2_t) {__p2, __p2});
  50644   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  50645   return __ret;
  50646 }
  50647 #endif
  50648 
  50649 __ai __attribute__((target("neon"))) float64x1_t vfma_n_f64(float64x1_t __p0, float64x1_t __p1, float64_t __p2) {
  50650   float64x1_t __ret;
  50651   __ret = vfma_f64(__p0, __p1, (float64x1_t) {__p2});
  50652   return __ret;
  50653 }
  50654 #ifdef __LITTLE_ENDIAN__
  50655 __ai __attribute__((target("neon"))) float64x2_t vfmsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  50656   float64x2_t __ret;
  50657   __ret = vfmaq_f64(__p0, -__p1, __p2);
  50658   return __ret;
  50659 }
  50660 #else
  50661 __ai __attribute__((target("neon"))) float64x2_t vfmsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  50662   float64x2_t __ret;
  50663   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  50664   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  50665   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  50666   __ret = __noswap_vfmaq_f64(__rev0, -__rev1, __rev2);
  50667   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  50668   return __ret;
  50669 }
  50670 #endif
  50671 
  50672 __ai __attribute__((target("neon"))) float64x1_t vfms_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) {
  50673   float64x1_t __ret;
  50674   __ret = vfma_f64(__p0, -__p1, __p2);
  50675   return __ret;
  50676 }
  50677 #define vfmsd_lane_f64(__p0_426, __p1_426, __p2_426, __p3_426) __extension__ ({ \
  50678   float64_t __ret_426; \
  50679   float64_t __s0_426 = __p0_426; \
  50680   float64_t __s1_426 = __p1_426; \
  50681   float64x1_t __s2_426 = __p2_426; \
  50682   __ret_426 = vfmad_lane_f64(__s0_426, -__s1_426, __s2_426, __p3_426); \
  50683   __ret_426; \
  50684 })
  50685 #ifdef __LITTLE_ENDIAN__
  50686 #define vfmss_lane_f32(__p0_427, __p1_427, __p2_427, __p3_427) __extension__ ({ \
  50687   float32_t __ret_427; \
  50688   float32_t __s0_427 = __p0_427; \
  50689   float32_t __s1_427 = __p1_427; \
  50690   float32x2_t __s2_427 = __p2_427; \
  50691   __ret_427 = vfmas_lane_f32(__s0_427, -__s1_427, __s2_427, __p3_427); \
  50692   __ret_427; \
  50693 })
  50694 #else
  50695 #define vfmss_lane_f32(__p0_428, __p1_428, __p2_428, __p3_428) __extension__ ({ \
  50696   float32_t __ret_428; \
  50697   float32_t __s0_428 = __p0_428; \
  50698   float32_t __s1_428 = __p1_428; \
  50699   float32x2_t __s2_428 = __p2_428; \
  50700   float32x2_t __rev2_428;  __rev2_428 = __builtin_shufflevector(__s2_428, __s2_428, 1, 0); \
  50701   __ret_428 = __noswap_vfmas_lane_f32(__s0_428, -__s1_428, __rev2_428, __p3_428); \
  50702   __ret_428; \
  50703 })
  50704 #endif
  50705 
  50706 #ifdef __LITTLE_ENDIAN__
  50707 #define vfmsq_lane_f64(__p0_429, __p1_429, __p2_429, __p3_429) __extension__ ({ \
  50708   float64x2_t __ret_429; \
  50709   float64x2_t __s0_429 = __p0_429; \
  50710   float64x2_t __s1_429 = __p1_429; \
  50711   float64x1_t __s2_429 = __p2_429; \
  50712   __ret_429 = vfmaq_lane_f64(__s0_429, -__s1_429, __s2_429, __p3_429); \
  50713   __ret_429; \
  50714 })
  50715 #else
  50716 #define vfmsq_lane_f64(__p0_430, __p1_430, __p2_430, __p3_430) __extension__ ({ \
  50717   float64x2_t __ret_430; \
  50718   float64x2_t __s0_430 = __p0_430; \
  50719   float64x2_t __s1_430 = __p1_430; \
  50720   float64x1_t __s2_430 = __p2_430; \
  50721   float64x2_t __rev0_430;  __rev0_430 = __builtin_shufflevector(__s0_430, __s0_430, 1, 0); \
  50722   float64x2_t __rev1_430;  __rev1_430 = __builtin_shufflevector(__s1_430, __s1_430, 1, 0); \
  50723   __ret_430 = __noswap_vfmaq_lane_f64(__rev0_430, -__rev1_430, __s2_430, __p3_430); \
  50724   __ret_430 = __builtin_shufflevector(__ret_430, __ret_430, 1, 0); \
  50725   __ret_430; \
  50726 })
  50727 #endif
  50728 
  50729 #ifdef __LITTLE_ENDIAN__
  50730 #define vfmsq_lane_f32(__p0_431, __p1_431, __p2_431, __p3_431) __extension__ ({ \
  50731   float32x4_t __ret_431; \
  50732   float32x4_t __s0_431 = __p0_431; \
  50733   float32x4_t __s1_431 = __p1_431; \
  50734   float32x2_t __s2_431 = __p2_431; \
  50735   __ret_431 = vfmaq_lane_f32(__s0_431, -__s1_431, __s2_431, __p3_431); \
  50736   __ret_431; \
  50737 })
  50738 #else
  50739 #define vfmsq_lane_f32(__p0_432, __p1_432, __p2_432, __p3_432) __extension__ ({ \
  50740   float32x4_t __ret_432; \
  50741   float32x4_t __s0_432 = __p0_432; \
  50742   float32x4_t __s1_432 = __p1_432; \
  50743   float32x2_t __s2_432 = __p2_432; \
  50744   float32x4_t __rev0_432;  __rev0_432 = __builtin_shufflevector(__s0_432, __s0_432, 3, 2, 1, 0); \
  50745   float32x4_t __rev1_432;  __rev1_432 = __builtin_shufflevector(__s1_432, __s1_432, 3, 2, 1, 0); \
  50746   float32x2_t __rev2_432;  __rev2_432 = __builtin_shufflevector(__s2_432, __s2_432, 1, 0); \
  50747   __ret_432 = __noswap_vfmaq_lane_f32(__rev0_432, -__rev1_432, __rev2_432, __p3_432); \
  50748   __ret_432 = __builtin_shufflevector(__ret_432, __ret_432, 3, 2, 1, 0); \
  50749   __ret_432; \
  50750 })
  50751 #endif
  50752 
  50753 #define vfms_lane_f64(__p0_433, __p1_433, __p2_433, __p3_433) __extension__ ({ \
  50754   float64x1_t __ret_433; \
  50755   float64x1_t __s0_433 = __p0_433; \
  50756   float64x1_t __s1_433 = __p1_433; \
  50757   float64x1_t __s2_433 = __p2_433; \
  50758   __ret_433 = vfma_lane_f64(__s0_433, -__s1_433, __s2_433, __p3_433); \
  50759   __ret_433; \
  50760 })
  50761 #ifdef __LITTLE_ENDIAN__
  50762 #define vfms_lane_f32(__p0_434, __p1_434, __p2_434, __p3_434) __extension__ ({ \
  50763   float32x2_t __ret_434; \
  50764   float32x2_t __s0_434 = __p0_434; \
  50765   float32x2_t __s1_434 = __p1_434; \
  50766   float32x2_t __s2_434 = __p2_434; \
  50767   __ret_434 = vfma_lane_f32(__s0_434, -__s1_434, __s2_434, __p3_434); \
  50768   __ret_434; \
  50769 })
  50770 #else
  50771 #define vfms_lane_f32(__p0_435, __p1_435, __p2_435, __p3_435) __extension__ ({ \
  50772   float32x2_t __ret_435; \
  50773   float32x2_t __s0_435 = __p0_435; \
  50774   float32x2_t __s1_435 = __p1_435; \
  50775   float32x2_t __s2_435 = __p2_435; \
  50776   float32x2_t __rev0_435;  __rev0_435 = __builtin_shufflevector(__s0_435, __s0_435, 1, 0); \
  50777   float32x2_t __rev1_435;  __rev1_435 = __builtin_shufflevector(__s1_435, __s1_435, 1, 0); \
  50778   float32x2_t __rev2_435;  __rev2_435 = __builtin_shufflevector(__s2_435, __s2_435, 1, 0); \
  50779   __ret_435 = __noswap_vfma_lane_f32(__rev0_435, -__rev1_435, __rev2_435, __p3_435); \
  50780   __ret_435 = __builtin_shufflevector(__ret_435, __ret_435, 1, 0); \
  50781   __ret_435; \
  50782 })
  50783 #endif
  50784 
  50785 #ifdef __LITTLE_ENDIAN__
  50786 #define vfmsd_laneq_f64(__p0_436, __p1_436, __p2_436, __p3_436) __extension__ ({ \
  50787   float64_t __ret_436; \
  50788   float64_t __s0_436 = __p0_436; \
  50789   float64_t __s1_436 = __p1_436; \
  50790   float64x2_t __s2_436 = __p2_436; \
  50791   __ret_436 = vfmad_laneq_f64(__s0_436, -__s1_436, __s2_436, __p3_436); \
  50792   __ret_436; \
  50793 })
  50794 #else
  50795 #define vfmsd_laneq_f64(__p0_437, __p1_437, __p2_437, __p3_437) __extension__ ({ \
  50796   float64_t __ret_437; \
  50797   float64_t __s0_437 = __p0_437; \
  50798   float64_t __s1_437 = __p1_437; \
  50799   float64x2_t __s2_437 = __p2_437; \
  50800   float64x2_t __rev2_437;  __rev2_437 = __builtin_shufflevector(__s2_437, __s2_437, 1, 0); \
  50801   __ret_437 = __noswap_vfmad_laneq_f64(__s0_437, -__s1_437, __rev2_437, __p3_437); \
  50802   __ret_437; \
  50803 })
  50804 #endif
  50805 
  50806 #ifdef __LITTLE_ENDIAN__
  50807 #define vfmss_laneq_f32(__p0_438, __p1_438, __p2_438, __p3_438) __extension__ ({ \
  50808   float32_t __ret_438; \
  50809   float32_t __s0_438 = __p0_438; \
  50810   float32_t __s1_438 = __p1_438; \
  50811   float32x4_t __s2_438 = __p2_438; \
  50812   __ret_438 = vfmas_laneq_f32(__s0_438, -__s1_438, __s2_438, __p3_438); \
  50813   __ret_438; \
  50814 })
  50815 #else
  50816 #define vfmss_laneq_f32(__p0_439, __p1_439, __p2_439, __p3_439) __extension__ ({ \
  50817   float32_t __ret_439; \
  50818   float32_t __s0_439 = __p0_439; \
  50819   float32_t __s1_439 = __p1_439; \
  50820   float32x4_t __s2_439 = __p2_439; \
  50821   float32x4_t __rev2_439;  __rev2_439 = __builtin_shufflevector(__s2_439, __s2_439, 3, 2, 1, 0); \
  50822   __ret_439 = __noswap_vfmas_laneq_f32(__s0_439, -__s1_439, __rev2_439, __p3_439); \
  50823   __ret_439; \
  50824 })
  50825 #endif
  50826 
  50827 #ifdef __LITTLE_ENDIAN__
  50828 #define vfmsq_laneq_f64(__p0_440, __p1_440, __p2_440, __p3_440) __extension__ ({ \
  50829   float64x2_t __ret_440; \
  50830   float64x2_t __s0_440 = __p0_440; \
  50831   float64x2_t __s1_440 = __p1_440; \
  50832   float64x2_t __s2_440 = __p2_440; \
  50833   __ret_440 = vfmaq_laneq_f64(__s0_440, -__s1_440, __s2_440, __p3_440); \
  50834   __ret_440; \
  50835 })
  50836 #else
  50837 #define vfmsq_laneq_f64(__p0_441, __p1_441, __p2_441, __p3_441) __extension__ ({ \
  50838   float64x2_t __ret_441; \
  50839   float64x2_t __s0_441 = __p0_441; \
  50840   float64x2_t __s1_441 = __p1_441; \
  50841   float64x2_t __s2_441 = __p2_441; \
  50842   float64x2_t __rev0_441;  __rev0_441 = __builtin_shufflevector(__s0_441, __s0_441, 1, 0); \
  50843   float64x2_t __rev1_441;  __rev1_441 = __builtin_shufflevector(__s1_441, __s1_441, 1, 0); \
  50844   float64x2_t __rev2_441;  __rev2_441 = __builtin_shufflevector(__s2_441, __s2_441, 1, 0); \
  50845   __ret_441 = __noswap_vfmaq_laneq_f64(__rev0_441, -__rev1_441, __rev2_441, __p3_441); \
  50846   __ret_441 = __builtin_shufflevector(__ret_441, __ret_441, 1, 0); \
  50847   __ret_441; \
  50848 })
  50849 #endif
  50850 
  50851 #ifdef __LITTLE_ENDIAN__
  50852 #define vfmsq_laneq_f32(__p0_442, __p1_442, __p2_442, __p3_442) __extension__ ({ \
  50853   float32x4_t __ret_442; \
  50854   float32x4_t __s0_442 = __p0_442; \
  50855   float32x4_t __s1_442 = __p1_442; \
  50856   float32x4_t __s2_442 = __p2_442; \
  50857   __ret_442 = vfmaq_laneq_f32(__s0_442, -__s1_442, __s2_442, __p3_442); \
  50858   __ret_442; \
  50859 })
  50860 #else
  50861 #define vfmsq_laneq_f32(__p0_443, __p1_443, __p2_443, __p3_443) __extension__ ({ \
  50862   float32x4_t __ret_443; \
  50863   float32x4_t __s0_443 = __p0_443; \
  50864   float32x4_t __s1_443 = __p1_443; \
  50865   float32x4_t __s2_443 = __p2_443; \
  50866   float32x4_t __rev0_443;  __rev0_443 = __builtin_shufflevector(__s0_443, __s0_443, 3, 2, 1, 0); \
  50867   float32x4_t __rev1_443;  __rev1_443 = __builtin_shufflevector(__s1_443, __s1_443, 3, 2, 1, 0); \
  50868   float32x4_t __rev2_443;  __rev2_443 = __builtin_shufflevector(__s2_443, __s2_443, 3, 2, 1, 0); \
  50869   __ret_443 = __noswap_vfmaq_laneq_f32(__rev0_443, -__rev1_443, __rev2_443, __p3_443); \
  50870   __ret_443 = __builtin_shufflevector(__ret_443, __ret_443, 3, 2, 1, 0); \
  50871   __ret_443; \
  50872 })
  50873 #endif
  50874 
  50875 #ifdef __LITTLE_ENDIAN__
  50876 #define vfms_laneq_f64(__p0_444, __p1_444, __p2_444, __p3_444) __extension__ ({ \
  50877   float64x1_t __ret_444; \
  50878   float64x1_t __s0_444 = __p0_444; \
  50879   float64x1_t __s1_444 = __p1_444; \
  50880   float64x2_t __s2_444 = __p2_444; \
  50881   __ret_444 = vfma_laneq_f64(__s0_444, -__s1_444, __s2_444, __p3_444); \
  50882   __ret_444; \
  50883 })
  50884 #else
  50885 #define vfms_laneq_f64(__p0_445, __p1_445, __p2_445, __p3_445) __extension__ ({ \
  50886   float64x1_t __ret_445; \
  50887   float64x1_t __s0_445 = __p0_445; \
  50888   float64x1_t __s1_445 = __p1_445; \
  50889   float64x2_t __s2_445 = __p2_445; \
  50890   float64x2_t __rev2_445;  __rev2_445 = __builtin_shufflevector(__s2_445, __s2_445, 1, 0); \
  50891   __ret_445 = __noswap_vfma_laneq_f64(__s0_445, -__s1_445, __rev2_445, __p3_445); \
  50892   __ret_445; \
  50893 })
  50894 #endif
  50895 
  50896 #ifdef __LITTLE_ENDIAN__
  50897 #define vfms_laneq_f32(__p0_446, __p1_446, __p2_446, __p3_446) __extension__ ({ \
  50898   float32x2_t __ret_446; \
  50899   float32x2_t __s0_446 = __p0_446; \
  50900   float32x2_t __s1_446 = __p1_446; \
  50901   float32x4_t __s2_446 = __p2_446; \
  50902   __ret_446 = vfma_laneq_f32(__s0_446, -__s1_446, __s2_446, __p3_446); \
  50903   __ret_446; \
  50904 })
  50905 #else
  50906 #define vfms_laneq_f32(__p0_447, __p1_447, __p2_447, __p3_447) __extension__ ({ \
  50907   float32x2_t __ret_447; \
  50908   float32x2_t __s0_447 = __p0_447; \
  50909   float32x2_t __s1_447 = __p1_447; \
  50910   float32x4_t __s2_447 = __p2_447; \
  50911   float32x2_t __rev0_447;  __rev0_447 = __builtin_shufflevector(__s0_447, __s0_447, 1, 0); \
  50912   float32x2_t __rev1_447;  __rev1_447 = __builtin_shufflevector(__s1_447, __s1_447, 1, 0); \
  50913   float32x4_t __rev2_447;  __rev2_447 = __builtin_shufflevector(__s2_447, __s2_447, 3, 2, 1, 0); \
  50914   __ret_447 = __noswap_vfma_laneq_f32(__rev0_447, -__rev1_447, __rev2_447, __p3_447); \
  50915   __ret_447 = __builtin_shufflevector(__ret_447, __ret_447, 1, 0); \
  50916   __ret_447; \
  50917 })
  50918 #endif
  50919 
  50920 #ifdef __LITTLE_ENDIAN__
  50921 __ai __attribute__((target("neon"))) float64x2_t vfmsq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) {
  50922   float64x2_t __ret;
  50923   __ret = vfmaq_f64(__p0, -__p1, (float64x2_t) {__p2, __p2});
  50924   return __ret;
  50925 }
  50926 #else
  50927 __ai __attribute__((target("neon"))) float64x2_t vfmsq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) {
  50928   float64x2_t __ret;
  50929   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  50930   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  50931   __ret = __noswap_vfmaq_f64(__rev0, -__rev1, (float64x2_t) {__p2, __p2});
  50932   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  50933   return __ret;
  50934 }
  50935 #endif
  50936 
  50937 #ifdef __LITTLE_ENDIAN__
  50938 __ai __attribute__((target("neon"))) float32x4_t vfmsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  50939   float32x4_t __ret;
  50940   __ret = vfmaq_f32(__p0, -__p1, (float32x4_t) {__p2, __p2, __p2, __p2});
  50941   return __ret;
  50942 }
  50943 #else
  50944 __ai __attribute__((target("neon"))) float32x4_t vfmsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) {
  50945   float32x4_t __ret;
  50946   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  50947   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  50948   __ret = __noswap_vfmaq_f32(__rev0, -__rev1, (float32x4_t) {__p2, __p2, __p2, __p2});
  50949   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  50950   return __ret;
  50951 }
  50952 #endif
  50953 
  50954 __ai __attribute__((target("neon"))) float64x1_t vfms_n_f64(float64x1_t __p0, float64x1_t __p1, float64_t __p2) {
  50955   float64x1_t __ret;
  50956   __ret = vfma_f64(__p0, -__p1, (float64x1_t) {__p2});
  50957   return __ret;
  50958 }
  50959 #ifdef __LITTLE_ENDIAN__
  50960 __ai __attribute__((target("neon"))) float32x2_t vfms_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  50961   float32x2_t __ret;
  50962   __ret = vfma_f32(__p0, -__p1, (float32x2_t) {__p2, __p2});
  50963   return __ret;
  50964 }
  50965 #else
  50966 __ai __attribute__((target("neon"))) float32x2_t vfms_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) {
  50967   float32x2_t __ret;
  50968   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  50969   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  50970   __ret = __noswap_vfma_f32(__rev0, -__rev1, (float32x2_t) {__p2, __p2});
  50971   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  50972   return __ret;
  50973 }
  50974 #endif
  50975 
  50976 #ifdef __LITTLE_ENDIAN__
  50977 __ai __attribute__((target("neon"))) poly64x1_t vget_high_p64(poly64x2_t __p0) {
  50978   poly64x1_t __ret;
  50979   __ret = __builtin_shufflevector(__p0, __p0, 1);
  50980   return __ret;
  50981 }
  50982 #else
  50983 __ai __attribute__((target("neon"))) poly64x1_t vget_high_p64(poly64x2_t __p0) {
  50984   poly64x1_t __ret;
  50985   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  50986   __ret = __builtin_shufflevector(__rev0, __rev0, 1);
  50987   return __ret;
  50988 }
  50989 __ai __attribute__((target("neon"))) poly64x1_t __noswap_vget_high_p64(poly64x2_t __p0) {
  50990   poly64x1_t __ret;
  50991   __ret = __builtin_shufflevector(__p0, __p0, 1);
  50992   return __ret;
  50993 }
  50994 #endif
  50995 
  50996 #ifdef __LITTLE_ENDIAN__
  50997 __ai __attribute__((target("neon"))) float64x1_t vget_high_f64(float64x2_t __p0) {
  50998   float64x1_t __ret;
  50999   __ret = __builtin_shufflevector(__p0, __p0, 1);
  51000   return __ret;
  51001 }
  51002 #else
  51003 __ai __attribute__((target("neon"))) float64x1_t vget_high_f64(float64x2_t __p0) {
  51004   float64x1_t __ret;
  51005   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  51006   __ret = __builtin_shufflevector(__rev0, __rev0, 1);
  51007   return __ret;
  51008 }
  51009 #endif
  51010 
  51011 #define vget_lane_p64(__p0, __p1) __extension__ ({ \
  51012   poly64_t __ret; \
  51013   poly64x1_t __s0 = __p0; \
  51014   __ret = (poly64_t) __builtin_neon_vget_lane_i64((poly64x1_t)__s0, __p1); \
  51015   __ret; \
  51016 })
  51017 #ifdef __LITTLE_ENDIAN__
  51018 #define vgetq_lane_p64(__p0, __p1) __extension__ ({ \
  51019   poly64_t __ret; \
  51020   poly64x2_t __s0 = __p0; \
  51021   __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__s0, __p1); \
  51022   __ret; \
  51023 })
  51024 #else
  51025 #define vgetq_lane_p64(__p0, __p1) __extension__ ({ \
  51026   poly64_t __ret; \
  51027   poly64x2_t __s0 = __p0; \
  51028   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  51029   __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__rev0, __p1); \
  51030   __ret; \
  51031 })
  51032 #define __noswap_vgetq_lane_p64(__p0, __p1) __extension__ ({ \
  51033   poly64_t __ret; \
  51034   poly64x2_t __s0 = __p0; \
  51035   __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__s0, __p1); \
  51036   __ret; \
  51037 })
  51038 #endif
  51039 
  51040 #ifdef __LITTLE_ENDIAN__
  51041 #define vgetq_lane_f64(__p0, __p1) __extension__ ({ \
  51042   float64_t __ret; \
  51043   float64x2_t __s0 = __p0; \
  51044   __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__s0, __p1); \
  51045   __ret; \
  51046 })
  51047 #else
  51048 #define vgetq_lane_f64(__p0, __p1) __extension__ ({ \
  51049   float64_t __ret; \
  51050   float64x2_t __s0 = __p0; \
  51051   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  51052   __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__rev0, __p1); \
  51053   __ret; \
  51054 })
  51055 #define __noswap_vgetq_lane_f64(__p0, __p1) __extension__ ({ \
  51056   float64_t __ret; \
  51057   float64x2_t __s0 = __p0; \
  51058   __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__s0, __p1); \
  51059   __ret; \
  51060 })
  51061 #endif
  51062 
  51063 #define vget_lane_f64(__p0, __p1) __extension__ ({ \
  51064   float64_t __ret; \
  51065   float64x1_t __s0 = __p0; \
  51066   __ret = (float64_t) __builtin_neon_vget_lane_f64((float64x1_t)__s0, __p1); \
  51067   __ret; \
  51068 })
  51069 #ifdef __LITTLE_ENDIAN__
  51070 __ai __attribute__((target("neon"))) poly64x1_t vget_low_p64(poly64x2_t __p0) {
  51071   poly64x1_t __ret;
  51072   __ret = __builtin_shufflevector(__p0, __p0, 0);
  51073   return __ret;
  51074 }
  51075 #else
  51076 __ai __attribute__((target("neon"))) poly64x1_t vget_low_p64(poly64x2_t __p0) {
  51077   poly64x1_t __ret;
  51078   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  51079   __ret = __builtin_shufflevector(__rev0, __rev0, 0);
  51080   return __ret;
  51081 }
  51082 #endif
  51083 
  51084 #ifdef __LITTLE_ENDIAN__
  51085 __ai __attribute__((target("neon"))) float64x1_t vget_low_f64(float64x2_t __p0) {
  51086   float64x1_t __ret;
  51087   __ret = __builtin_shufflevector(__p0, __p0, 0);
  51088   return __ret;
  51089 }
  51090 #else
  51091 __ai __attribute__((target("neon"))) float64x1_t vget_low_f64(float64x2_t __p0) {
  51092   float64x1_t __ret;
  51093   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  51094   __ret = __builtin_shufflevector(__rev0, __rev0, 0);
  51095   return __ret;
  51096 }
  51097 #endif
  51098 
  51099 #define vld1_p64(__p0) __extension__ ({ \
  51100   poly64x1_t __ret; \
  51101   __ret = (poly64x1_t) __builtin_neon_vld1_v(__p0, 6); \
  51102   __ret; \
  51103 })
  51104 #ifdef __LITTLE_ENDIAN__
  51105 #define vld1q_p64(__p0) __extension__ ({ \
  51106   poly64x2_t __ret; \
  51107   __ret = (poly64x2_t) __builtin_neon_vld1q_v(__p0, 38); \
  51108   __ret; \
  51109 })
  51110 #else
  51111 #define vld1q_p64(__p0) __extension__ ({ \
  51112   poly64x2_t __ret; \
  51113   __ret = (poly64x2_t) __builtin_neon_vld1q_v(__p0, 38); \
  51114   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51115   __ret; \
  51116 })
  51117 #endif
  51118 
  51119 #ifdef __LITTLE_ENDIAN__
  51120 #define vld1q_f64(__p0) __extension__ ({ \
  51121   float64x2_t __ret; \
  51122   __ret = (float64x2_t) __builtin_neon_vld1q_v(__p0, 42); \
  51123   __ret; \
  51124 })
  51125 #else
  51126 #define vld1q_f64(__p0) __extension__ ({ \
  51127   float64x2_t __ret; \
  51128   __ret = (float64x2_t) __builtin_neon_vld1q_v(__p0, 42); \
  51129   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51130   __ret; \
  51131 })
  51132 #endif
  51133 
  51134 #define vld1_f64(__p0) __extension__ ({ \
  51135   float64x1_t __ret; \
  51136   __ret = (float64x1_t) __builtin_neon_vld1_v(__p0, 10); \
  51137   __ret; \
  51138 })
  51139 #define vld1_dup_p64(__p0) __extension__ ({ \
  51140   poly64x1_t __ret; \
  51141   __ret = (poly64x1_t) __builtin_neon_vld1_dup_v(__p0, 6); \
  51142   __ret; \
  51143 })
  51144 #ifdef __LITTLE_ENDIAN__
  51145 #define vld1q_dup_p64(__p0) __extension__ ({ \
  51146   poly64x2_t __ret; \
  51147   __ret = (poly64x2_t) __builtin_neon_vld1q_dup_v(__p0, 38); \
  51148   __ret; \
  51149 })
  51150 #else
  51151 #define vld1q_dup_p64(__p0) __extension__ ({ \
  51152   poly64x2_t __ret; \
  51153   __ret = (poly64x2_t) __builtin_neon_vld1q_dup_v(__p0, 38); \
  51154   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51155   __ret; \
  51156 })
  51157 #endif
  51158 
  51159 #ifdef __LITTLE_ENDIAN__
  51160 #define vld1q_dup_f64(__p0) __extension__ ({ \
  51161   float64x2_t __ret; \
  51162   __ret = (float64x2_t) __builtin_neon_vld1q_dup_v(__p0, 42); \
  51163   __ret; \
  51164 })
  51165 #else
  51166 #define vld1q_dup_f64(__p0) __extension__ ({ \
  51167   float64x2_t __ret; \
  51168   __ret = (float64x2_t) __builtin_neon_vld1q_dup_v(__p0, 42); \
  51169   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51170   __ret; \
  51171 })
  51172 #endif
  51173 
  51174 #define vld1_dup_f64(__p0) __extension__ ({ \
  51175   float64x1_t __ret; \
  51176   __ret = (float64x1_t) __builtin_neon_vld1_dup_v(__p0, 10); \
  51177   __ret; \
  51178 })
  51179 #define vld1_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51180   poly64x1_t __ret; \
  51181   poly64x1_t __s1 = __p1; \
  51182   __ret = (poly64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 6); \
  51183   __ret; \
  51184 })
  51185 #ifdef __LITTLE_ENDIAN__
  51186 #define vld1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51187   poly64x2_t __ret; \
  51188   poly64x2_t __s1 = __p1; \
  51189   __ret = (poly64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 38); \
  51190   __ret; \
  51191 })
  51192 #else
  51193 #define vld1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51194   poly64x2_t __ret; \
  51195   poly64x2_t __s1 = __p1; \
  51196   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  51197   __ret = (poly64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 38); \
  51198   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51199   __ret; \
  51200 })
  51201 #endif
  51202 
  51203 #ifdef __LITTLE_ENDIAN__
  51204 #define vld1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51205   float64x2_t __ret; \
  51206   float64x2_t __s1 = __p1; \
  51207   __ret = (float64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 42); \
  51208   __ret; \
  51209 })
  51210 #else
  51211 #define vld1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51212   float64x2_t __ret; \
  51213   float64x2_t __s1 = __p1; \
  51214   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  51215   __ret = (float64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 42); \
  51216   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  51217   __ret; \
  51218 })
  51219 #endif
  51220 
  51221 #define vld1_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51222   float64x1_t __ret; \
  51223   float64x1_t __s1 = __p1; \
  51224   __ret = (float64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 10); \
  51225   __ret; \
  51226 })
  51227 #define vld1_p64_x2(__p0) __extension__ ({ \
  51228   poly64x1x2_t __ret; \
  51229   __builtin_neon_vld1_x2_v(&__ret, __p0, 6); \
  51230   __ret; \
  51231 })
  51232 #ifdef __LITTLE_ENDIAN__
  51233 #define vld1q_p64_x2(__p0) __extension__ ({ \
  51234   poly64x2x2_t __ret; \
  51235   __builtin_neon_vld1q_x2_v(&__ret, __p0, 38); \
  51236   __ret; \
  51237 })
  51238 #else
  51239 #define vld1q_p64_x2(__p0) __extension__ ({ \
  51240   poly64x2x2_t __ret; \
  51241   __builtin_neon_vld1q_x2_v(&__ret, __p0, 38); \
  51242  \
  51243   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51244   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51245   __ret; \
  51246 })
  51247 #endif
  51248 
  51249 #ifdef __LITTLE_ENDIAN__
  51250 #define vld1q_f64_x2(__p0) __extension__ ({ \
  51251   float64x2x2_t __ret; \
  51252   __builtin_neon_vld1q_x2_v(&__ret, __p0, 42); \
  51253   __ret; \
  51254 })
  51255 #else
  51256 #define vld1q_f64_x2(__p0) __extension__ ({ \
  51257   float64x2x2_t __ret; \
  51258   __builtin_neon_vld1q_x2_v(&__ret, __p0, 42); \
  51259  \
  51260   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51261   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51262   __ret; \
  51263 })
  51264 #endif
  51265 
  51266 #define vld1_f64_x2(__p0) __extension__ ({ \
  51267   float64x1x2_t __ret; \
  51268   __builtin_neon_vld1_x2_v(&__ret, __p0, 10); \
  51269   __ret; \
  51270 })
  51271 #define vld1_p64_x3(__p0) __extension__ ({ \
  51272   poly64x1x3_t __ret; \
  51273   __builtin_neon_vld1_x3_v(&__ret, __p0, 6); \
  51274   __ret; \
  51275 })
  51276 #ifdef __LITTLE_ENDIAN__
  51277 #define vld1q_p64_x3(__p0) __extension__ ({ \
  51278   poly64x2x3_t __ret; \
  51279   __builtin_neon_vld1q_x3_v(&__ret, __p0, 38); \
  51280   __ret; \
  51281 })
  51282 #else
  51283 #define vld1q_p64_x3(__p0) __extension__ ({ \
  51284   poly64x2x3_t __ret; \
  51285   __builtin_neon_vld1q_x3_v(&__ret, __p0, 38); \
  51286  \
  51287   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51288   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51289   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51290   __ret; \
  51291 })
  51292 #endif
  51293 
  51294 #ifdef __LITTLE_ENDIAN__
  51295 #define vld1q_f64_x3(__p0) __extension__ ({ \
  51296   float64x2x3_t __ret; \
  51297   __builtin_neon_vld1q_x3_v(&__ret, __p0, 42); \
  51298   __ret; \
  51299 })
  51300 #else
  51301 #define vld1q_f64_x3(__p0) __extension__ ({ \
  51302   float64x2x3_t __ret; \
  51303   __builtin_neon_vld1q_x3_v(&__ret, __p0, 42); \
  51304  \
  51305   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51306   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51307   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51308   __ret; \
  51309 })
  51310 #endif
  51311 
  51312 #define vld1_f64_x3(__p0) __extension__ ({ \
  51313   float64x1x3_t __ret; \
  51314   __builtin_neon_vld1_x3_v(&__ret, __p0, 10); \
  51315   __ret; \
  51316 })
  51317 #define vld1_p64_x4(__p0) __extension__ ({ \
  51318   poly64x1x4_t __ret; \
  51319   __builtin_neon_vld1_x4_v(&__ret, __p0, 6); \
  51320   __ret; \
  51321 })
  51322 #ifdef __LITTLE_ENDIAN__
  51323 #define vld1q_p64_x4(__p0) __extension__ ({ \
  51324   poly64x2x4_t __ret; \
  51325   __builtin_neon_vld1q_x4_v(&__ret, __p0, 38); \
  51326   __ret; \
  51327 })
  51328 #else
  51329 #define vld1q_p64_x4(__p0) __extension__ ({ \
  51330   poly64x2x4_t __ret; \
  51331   __builtin_neon_vld1q_x4_v(&__ret, __p0, 38); \
  51332  \
  51333   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51334   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51335   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51336   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  51337   __ret; \
  51338 })
  51339 #endif
  51340 
  /* vld1q_f64_x4(__p0): statement-expression macro that declares a
   * float64x2x4_t __ret, has __builtin_neon_vld1q_x4_v(&__ret, __p0, 42) fill
   * it, and evaluates to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 4 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  51341 #ifdef __LITTLE_ENDIAN__
  51342 #define vld1q_f64_x4(__p0) __extension__ ({ \
  51343   float64x2x4_t __ret; \
  51344   __builtin_neon_vld1q_x4_v(&__ret, __p0, 42); \
  51345   __ret; \
  51346 })
  51347 #else
  51348 #define vld1q_f64_x4(__p0) __extension__ ({ \
  51349   float64x2x4_t __ret; \
  51350   __builtin_neon_vld1q_x4_v(&__ret, __p0, 42); \
  51351  \
  51352   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51353   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51354   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51355   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  51356   __ret; \
  51357 })
  51358 #endif
  51359 
  /* vld1_f64_x4(__p0): statement-expression macro that declares a
   * float64x1x4_t __ret, has __builtin_neon_vld1_x4_v(&__ret, __p0, 10) fill
   * it, and evaluates to __ret.  No endian-specific variant is defined in
   * this block.
   * NOTE(review): 10 is presumably the builtin's vector-type code -- confirm. */
  51360 #define vld1_f64_x4(__p0) __extension__ ({ \
  51361   float64x1x4_t __ret; \
  51362   __builtin_neon_vld1_x4_v(&__ret, __p0, 10); \
  51363   __ret; \
  51364 })
  /* vld2_p64(__p0): statement-expression macro that declares a poly64x1x2_t
   * __ret, has __builtin_neon_vld2_v(&__ret, __p0, 6) fill it, and evaluates
   * to __ret.  No endian-specific variant is defined in this block.
   * NOTE(review): 6 is presumably the builtin's vector-type code -- confirm. */
  51365 #define vld2_p64(__p0) __extension__ ({ \
  51366   poly64x1x2_t __ret; \
  51367   __builtin_neon_vld2_v(&__ret, __p0, 6); \
  51368   __ret; \
  51369 })
  /* vld2q_p64(__p0): statement-expression macro that declares a poly64x2x2_t
   * __ret, has __builtin_neon_vld2q_v(&__ret, __p0, 38) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 38 is presumably the builtin's vector-type code -- confirm. */
  51370 #ifdef __LITTLE_ENDIAN__
  51371 #define vld2q_p64(__p0) __extension__ ({ \
  51372   poly64x2x2_t __ret; \
  51373   __builtin_neon_vld2q_v(&__ret, __p0, 38); \
  51374   __ret; \
  51375 })
  51376 #else
  51377 #define vld2q_p64(__p0) __extension__ ({ \
  51378   poly64x2x2_t __ret; \
  51379   __builtin_neon_vld2q_v(&__ret, __p0, 38); \
  51380  \
  51381   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51382   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51383   __ret; \
  51384 })
  51385 #endif
  51386 
  /* vld2q_u64(__p0): statement-expression macro that declares a uint64x2x2_t
   * __ret, has __builtin_neon_vld2q_v(&__ret, __p0, 51) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 51 is presumably the builtin's vector-type code -- confirm. */
  51387 #ifdef __LITTLE_ENDIAN__
  51388 #define vld2q_u64(__p0) __extension__ ({ \
  51389   uint64x2x2_t __ret; \
  51390   __builtin_neon_vld2q_v(&__ret, __p0, 51); \
  51391   __ret; \
  51392 })
  51393 #else
  51394 #define vld2q_u64(__p0) __extension__ ({ \
  51395   uint64x2x2_t __ret; \
  51396   __builtin_neon_vld2q_v(&__ret, __p0, 51); \
  51397  \
  51398   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51399   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51400   __ret; \
  51401 })
  51402 #endif
  51403 
  /* vld2q_f64(__p0): statement-expression macro that declares a float64x2x2_t
   * __ret, has __builtin_neon_vld2q_v(&__ret, __p0, 42) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  51404 #ifdef __LITTLE_ENDIAN__
  51405 #define vld2q_f64(__p0) __extension__ ({ \
  51406   float64x2x2_t __ret; \
  51407   __builtin_neon_vld2q_v(&__ret, __p0, 42); \
  51408   __ret; \
  51409 })
  51410 #else
  51411 #define vld2q_f64(__p0) __extension__ ({ \
  51412   float64x2x2_t __ret; \
  51413   __builtin_neon_vld2q_v(&__ret, __p0, 42); \
  51414  \
  51415   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51416   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51417   __ret; \
  51418 })
  51419 #endif
  51420 
  /* vld2q_s64(__p0): statement-expression macro that declares an int64x2x2_t
   * __ret, has __builtin_neon_vld2q_v(&__ret, __p0, 35) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 35 is presumably the builtin's vector-type code -- confirm. */
  51421 #ifdef __LITTLE_ENDIAN__
  51422 #define vld2q_s64(__p0) __extension__ ({ \
  51423   int64x2x2_t __ret; \
  51424   __builtin_neon_vld2q_v(&__ret, __p0, 35); \
  51425   __ret; \
  51426 })
  51427 #else
  51428 #define vld2q_s64(__p0) __extension__ ({ \
  51429   int64x2x2_t __ret; \
  51430   __builtin_neon_vld2q_v(&__ret, __p0, 35); \
  51431  \
  51432   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51433   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51434   __ret; \
  51435 })
  51436 #endif
  51437 
  /* vld2_f64(__p0): statement-expression macro that declares a float64x1x2_t
   * __ret, has __builtin_neon_vld2_v(&__ret, __p0, 10) fill it, and evaluates
   * to __ret.  No endian-specific variant is defined in this block.
   * NOTE(review): 10 is presumably the builtin's vector-type code -- confirm. */
  51438 #define vld2_f64(__p0) __extension__ ({ \
  51439   float64x1x2_t __ret; \
  51440   __builtin_neon_vld2_v(&__ret, __p0, 10); \
  51441   __ret; \
  51442 })
  /* vld2_dup_p64(__p0): statement-expression macro that declares a
   * poly64x1x2_t __ret, has __builtin_neon_vld2_dup_v(&__ret, __p0, 6) fill
   * it, and evaluates to __ret.  No endian-specific variant is defined in
   * this block.
   * NOTE(review): 6 is presumably the builtin's vector-type code -- confirm. */
  51443 #define vld2_dup_p64(__p0) __extension__ ({ \
  51444   poly64x1x2_t __ret; \
  51445   __builtin_neon_vld2_dup_v(&__ret, __p0, 6); \
  51446   __ret; \
  51447 })
  /* vld2q_dup_p64(__p0): statement-expression macro that declares a
   * poly64x2x2_t __ret, has __builtin_neon_vld2q_dup_v(&__ret, __p0, 38) fill
   * it, and evaluates to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 38 is presumably the builtin's vector-type code -- confirm. */
  51448 #ifdef __LITTLE_ENDIAN__
  51449 #define vld2q_dup_p64(__p0) __extension__ ({ \
  51450   poly64x2x2_t __ret; \
  51451   __builtin_neon_vld2q_dup_v(&__ret, __p0, 38); \
  51452   __ret; \
  51453 })
  51454 #else
  51455 #define vld2q_dup_p64(__p0) __extension__ ({ \
  51456   poly64x2x2_t __ret; \
  51457   __builtin_neon_vld2q_dup_v(&__ret, __p0, 38); \
  51458  \
  51459   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51460   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51461   __ret; \
  51462 })
  51463 #endif
  51464 
  /* vld2q_dup_f64(__p0): statement-expression macro that declares a
   * float64x2x2_t __ret, has __builtin_neon_vld2q_dup_v(&__ret, __p0, 42) fill
   * it, and evaluates to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 2 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  51465 #ifdef __LITTLE_ENDIAN__
  51466 #define vld2q_dup_f64(__p0) __extension__ ({ \
  51467   float64x2x2_t __ret; \
  51468   __builtin_neon_vld2q_dup_v(&__ret, __p0, 42); \
  51469   __ret; \
  51470 })
  51471 #else
  51472 #define vld2q_dup_f64(__p0) __extension__ ({ \
  51473   float64x2x2_t __ret; \
  51474   __builtin_neon_vld2q_dup_v(&__ret, __p0, 42); \
  51475  \
  51476   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51477   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51478   __ret; \
  51479 })
  51480 #endif
  51481 
  /* vld2_dup_f64(__p0): statement-expression macro that declares a
   * float64x1x2_t __ret, has __builtin_neon_vld2_dup_v(&__ret, __p0, 10) fill
   * it, and evaluates to __ret.  No endian-specific variant is defined in
   * this block.
   * NOTE(review): 10 is presumably the builtin's vector-type code -- confirm. */
  51482 #define vld2_dup_f64(__p0) __extension__ ({ \
  51483   float64x1x2_t __ret; \
  51484   __builtin_neon_vld2_dup_v(&__ret, __p0, 10); \
  51485   __ret; \
  51486 })
  /* vld2_lane_p64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a poly64x1x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2_lane_v(&__ret, ..., 6).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 6 the type code. */
  51487 #define vld2_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51488   poly64x1x2_t __ret; \
  51489   poly64x1x2_t __s1 = __p1; \
  51490   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 6); \
  51491   __ret; \
  51492 })
  /* vld2q_lane_p8(__p0, __p1, __p2): statement-expression macro evaluating to
   * a poly8x16x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 36).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 36 the type code. */
  51493 #ifdef __LITTLE_ENDIAN__
  51494 #define vld2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  51495   poly8x16x2_t __ret; \
  51496   poly8x16x2_t __s1 = __p1; \
  51497   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 36); \
  51498   __ret; \
  51499 })
  51500 #else
  51501 #define vld2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  51502   poly8x16x2_t __ret; \
  51503   poly8x16x2_t __s1 = __p1; \
  51504   poly8x16x2_t __rev1; \
  51505   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51506   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51507   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 36); \
  51508  \
  51509   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51510   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51511   __ret; \
  51512 })
  51513 #endif
  51514 
  /* vld2q_lane_p64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a poly64x2x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 38).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 38 the type code. */
  51515 #ifdef __LITTLE_ENDIAN__
  51516 #define vld2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51517   poly64x2x2_t __ret; \
  51518   poly64x2x2_t __s1 = __p1; \
  51519   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 38); \
  51520   __ret; \
  51521 })
  51522 #else
  51523 #define vld2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51524   poly64x2x2_t __ret; \
  51525   poly64x2x2_t __s1 = __p1; \
  51526   poly64x2x2_t __rev1; \
  51527   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51528   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51529   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 38); \
  51530  \
  51531   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51532   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51533   __ret; \
  51534 })
  51535 #endif
  51536 
  /* vld2q_lane_u8(__p0, __p1, __p2): statement-expression macro evaluating to
   * a uint8x16x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 48).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 48 the type code. */
  51537 #ifdef __LITTLE_ENDIAN__
  51538 #define vld2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  51539   uint8x16x2_t __ret; \
  51540   uint8x16x2_t __s1 = __p1; \
  51541   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 48); \
  51542   __ret; \
  51543 })
  51544 #else
  51545 #define vld2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  51546   uint8x16x2_t __ret; \
  51547   uint8x16x2_t __s1 = __p1; \
  51548   uint8x16x2_t __rev1; \
  51549   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51550   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51551   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 48); \
  51552  \
  51553   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51554   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51555   __ret; \
  51556 })
  51557 #endif
  51558 
  /* vld2q_lane_u64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a uint64x2x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 51).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 51 the type code. */
  51559 #ifdef __LITTLE_ENDIAN__
  51560 #define vld2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51561   uint64x2x2_t __ret; \
  51562   uint64x2x2_t __s1 = __p1; \
  51563   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 51); \
  51564   __ret; \
  51565 })
  51566 #else
  51567 #define vld2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51568   uint64x2x2_t __ret; \
  51569   uint64x2x2_t __s1 = __p1; \
  51570   uint64x2x2_t __rev1; \
  51571   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51572   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51573   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 51); \
  51574  \
  51575   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51576   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51577   __ret; \
  51578 })
  51579 #endif
  51580 
  /* vld2q_lane_s8(__p0, __p1, __p2): statement-expression macro evaluating to
   * an int8x16x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 32).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 32 the type code. */
  51581 #ifdef __LITTLE_ENDIAN__
  51582 #define vld2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  51583   int8x16x2_t __ret; \
  51584   int8x16x2_t __s1 = __p1; \
  51585   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 32); \
  51586   __ret; \
  51587 })
  51588 #else
  51589 #define vld2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  51590   int8x16x2_t __ret; \
  51591   int8x16x2_t __s1 = __p1; \
  51592   int8x16x2_t __rev1; \
  51593   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51594   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51595   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 32); \
  51596  \
  51597   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51598   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51599   __ret; \
  51600 })
  51601 #endif
  51602 
  /* vld2q_lane_f64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a float64x2x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 42).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 42 the type code. */
  51603 #ifdef __LITTLE_ENDIAN__
  51604 #define vld2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51605   float64x2x2_t __ret; \
  51606   float64x2x2_t __s1 = __p1; \
  51607   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 42); \
  51608   __ret; \
  51609 })
  51610 #else
  51611 #define vld2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51612   float64x2x2_t __ret; \
  51613   float64x2x2_t __s1 = __p1; \
  51614   float64x2x2_t __rev1; \
  51615   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51616   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51617   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 42); \
  51618  \
  51619   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51620   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51621   __ret; \
  51622 })
  51623 #endif
  51624 
  /* vld2q_lane_s64(__p0, __p1, __p2): statement-expression macro evaluating
   * to an int64x2x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2q_lane_v(&__ret, ..., 35).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 35 the type code. */
  51625 #ifdef __LITTLE_ENDIAN__
  51626 #define vld2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51627   int64x2x2_t __ret; \
  51628   int64x2x2_t __s1 = __p1; \
  51629   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 35); \
  51630   __ret; \
  51631 })
  51632 #else
  51633 #define vld2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51634   int64x2x2_t __ret; \
  51635   int64x2x2_t __s1 = __p1; \
  51636   int64x2x2_t __rev1; \
  51637   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51638   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51639   __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 35); \
  51640  \
  51641   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51642   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51643   __ret; \
  51644 })
  51645 #endif
  51646 
  /* vld2_lane_u64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a uint64x1x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2_lane_v(&__ret, ..., 19).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 19 the type code. */
  51647 #define vld2_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51648   uint64x1x2_t __ret; \
  51649   uint64x1x2_t __s1 = __p1; \
  51650   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 19); \
  51651   __ret; \
  51652 })
  /* vld2_lane_f64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a float64x1x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2_lane_v(&__ret, ..., 10).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 10 the type code. */
  51653 #define vld2_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51654   float64x1x2_t __ret; \
  51655   float64x1x2_t __s1 = __p1; \
  51656   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 10); \
  51657   __ret; \
  51658 })
  /* vld2_lane_s64(__p0, __p1, __p2): statement-expression macro evaluating to
   * an int64x1x2_t.  __p1 is copied to __s1; its 2 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld2_lane_v(&__ret, ..., 3).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 3 the type code. */
  51659 #define vld2_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51660   int64x1x2_t __ret; \
  51661   int64x1x2_t __s1 = __p1; \
  51662   __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 3); \
  51663   __ret; \
  51664 })
  /* vld3_p64(__p0): statement-expression macro that declares a poly64x1x3_t
   * __ret, has __builtin_neon_vld3_v(&__ret, __p0, 6) fill it, and evaluates
   * to __ret.  No endian-specific variant is defined in this block.
   * NOTE(review): 6 is presumably the builtin's vector-type code -- confirm. */
  51665 #define vld3_p64(__p0) __extension__ ({ \
  51666   poly64x1x3_t __ret; \
  51667   __builtin_neon_vld3_v(&__ret, __p0, 6); \
  51668   __ret; \
  51669 })
  /* vld3q_p64(__p0): statement-expression macro that declares a poly64x2x3_t
   * __ret, has __builtin_neon_vld3q_v(&__ret, __p0, 38) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 38 is presumably the builtin's vector-type code -- confirm. */
  51670 #ifdef __LITTLE_ENDIAN__
  51671 #define vld3q_p64(__p0) __extension__ ({ \
  51672   poly64x2x3_t __ret; \
  51673   __builtin_neon_vld3q_v(&__ret, __p0, 38); \
  51674   __ret; \
  51675 })
  51676 #else
  51677 #define vld3q_p64(__p0) __extension__ ({ \
  51678   poly64x2x3_t __ret; \
  51679   __builtin_neon_vld3q_v(&__ret, __p0, 38); \
  51680  \
  51681   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51682   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51683   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51684   __ret; \
  51685 })
  51686 #endif
  51687 
  /* vld3q_u64(__p0): statement-expression macro that declares a uint64x2x3_t
   * __ret, has __builtin_neon_vld3q_v(&__ret, __p0, 51) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 51 is presumably the builtin's vector-type code -- confirm. */
  51688 #ifdef __LITTLE_ENDIAN__
  51689 #define vld3q_u64(__p0) __extension__ ({ \
  51690   uint64x2x3_t __ret; \
  51691   __builtin_neon_vld3q_v(&__ret, __p0, 51); \
  51692   __ret; \
  51693 })
  51694 #else
  51695 #define vld3q_u64(__p0) __extension__ ({ \
  51696   uint64x2x3_t __ret; \
  51697   __builtin_neon_vld3q_v(&__ret, __p0, 51); \
  51698  \
  51699   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51700   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51701   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51702   __ret; \
  51703 })
  51704 #endif
  51705 
  /* vld3q_f64(__p0): statement-expression macro that declares a float64x2x3_t
   * __ret, has __builtin_neon_vld3q_v(&__ret, __p0, 42) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  51706 #ifdef __LITTLE_ENDIAN__
  51707 #define vld3q_f64(__p0) __extension__ ({ \
  51708   float64x2x3_t __ret; \
  51709   __builtin_neon_vld3q_v(&__ret, __p0, 42); \
  51710   __ret; \
  51711 })
  51712 #else
  51713 #define vld3q_f64(__p0) __extension__ ({ \
  51714   float64x2x3_t __ret; \
  51715   __builtin_neon_vld3q_v(&__ret, __p0, 42); \
  51716  \
  51717   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51718   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51719   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51720   __ret; \
  51721 })
  51722 #endif
  51723 
  /* vld3q_s64(__p0): statement-expression macro that declares an int64x2x3_t
   * __ret, has __builtin_neon_vld3q_v(&__ret, __p0, 35) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 35 is presumably the builtin's vector-type code -- confirm. */
  51724 #ifdef __LITTLE_ENDIAN__
  51725 #define vld3q_s64(__p0) __extension__ ({ \
  51726   int64x2x3_t __ret; \
  51727   __builtin_neon_vld3q_v(&__ret, __p0, 35); \
  51728   __ret; \
  51729 })
  51730 #else
  51731 #define vld3q_s64(__p0) __extension__ ({ \
  51732   int64x2x3_t __ret; \
  51733   __builtin_neon_vld3q_v(&__ret, __p0, 35); \
  51734  \
  51735   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51736   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51737   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51738   __ret; \
  51739 })
  51740 #endif
  51741 
  /* vld3_f64(__p0): statement-expression macro that declares a float64x1x3_t
   * __ret, has __builtin_neon_vld3_v(&__ret, __p0, 10) fill it, and evaluates
   * to __ret.  No endian-specific variant is defined in this block.
   * NOTE(review): 10 is presumably the builtin's vector-type code -- confirm. */
  51742 #define vld3_f64(__p0) __extension__ ({ \
  51743   float64x1x3_t __ret; \
  51744   __builtin_neon_vld3_v(&__ret, __p0, 10); \
  51745   __ret; \
  51746 })
  /* vld3_dup_p64(__p0): statement-expression macro that declares a
   * poly64x1x3_t __ret, has __builtin_neon_vld3_dup_v(&__ret, __p0, 6) fill
   * it, and evaluates to __ret.  No endian-specific variant is defined in
   * this block.
   * NOTE(review): 6 is presumably the builtin's vector-type code -- confirm. */
  51747 #define vld3_dup_p64(__p0) __extension__ ({ \
  51748   poly64x1x3_t __ret; \
  51749   __builtin_neon_vld3_dup_v(&__ret, __p0, 6); \
  51750   __ret; \
  51751 })
  /* vld3q_dup_p64(__p0): statement-expression macro that declares a
   * poly64x2x3_t __ret, has __builtin_neon_vld3q_dup_v(&__ret, __p0, 38) fill
   * it, and evaluates to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 38 is presumably the builtin's vector-type code -- confirm. */
  51752 #ifdef __LITTLE_ENDIAN__
  51753 #define vld3q_dup_p64(__p0) __extension__ ({ \
  51754   poly64x2x3_t __ret; \
  51755   __builtin_neon_vld3q_dup_v(&__ret, __p0, 38); \
  51756   __ret; \
  51757 })
  51758 #else
  51759 #define vld3q_dup_p64(__p0) __extension__ ({ \
  51760   poly64x2x3_t __ret; \
  51761   __builtin_neon_vld3q_dup_v(&__ret, __p0, 38); \
  51762  \
  51763   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51764   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51765   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51766   __ret; \
  51767 })
  51768 #endif
  51769 
  /* vld3q_dup_f64(__p0): statement-expression macro that declares a
   * float64x2x3_t __ret, has __builtin_neon_vld3q_dup_v(&__ret, __p0, 42) fill
   * it, and evaluates to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 3 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  51770 #ifdef __LITTLE_ENDIAN__
  51771 #define vld3q_dup_f64(__p0) __extension__ ({ \
  51772   float64x2x3_t __ret; \
  51773   __builtin_neon_vld3q_dup_v(&__ret, __p0, 42); \
  51774   __ret; \
  51775 })
  51776 #else
  51777 #define vld3q_dup_f64(__p0) __extension__ ({ \
  51778   float64x2x3_t __ret; \
  51779   __builtin_neon_vld3q_dup_v(&__ret, __p0, 42); \
  51780  \
  51781   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51782   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51783   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51784   __ret; \
  51785 })
  51786 #endif
  51787 
  /* vld3_dup_f64(__p0): statement-expression macro that declares a
   * float64x1x3_t __ret, has __builtin_neon_vld3_dup_v(&__ret, __p0, 10) fill
   * it, and evaluates to __ret.  No endian-specific variant is defined in
   * this block.
   * NOTE(review): 10 is presumably the builtin's vector-type code -- confirm. */
  51788 #define vld3_dup_f64(__p0) __extension__ ({ \
  51789   float64x1x3_t __ret; \
  51790   __builtin_neon_vld3_dup_v(&__ret, __p0, 10); \
  51791   __ret; \
  51792 })
  /* vld3_lane_p64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a poly64x1x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3_lane_v(&__ret, ..., 6).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 6 the type code. */
  51793 #define vld3_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51794   poly64x1x3_t __ret; \
  51795   poly64x1x3_t __s1 = __p1; \
  51796   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 6); \
  51797   __ret; \
  51798 })
  /* vld3q_lane_p8(__p0, __p1, __p2): statement-expression macro evaluating to
   * a poly8x16x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 36).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 36 the type code. */
  51799 #ifdef __LITTLE_ENDIAN__
  51800 #define vld3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  51801   poly8x16x3_t __ret; \
  51802   poly8x16x3_t __s1 = __p1; \
  51803   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 36); \
  51804   __ret; \
  51805 })
  51806 #else
  51807 #define vld3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  51808   poly8x16x3_t __ret; \
  51809   poly8x16x3_t __s1 = __p1; \
  51810   poly8x16x3_t __rev1; \
  51811   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51812   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51813   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51814   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 36); \
  51815  \
  51816   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51817   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51818   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51819   __ret; \
  51820 })
  51821 #endif
  51822 
  /* vld3q_lane_p64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a poly64x2x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 38).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 38 the type code. */
  51823 #ifdef __LITTLE_ENDIAN__
  51824 #define vld3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51825   poly64x2x3_t __ret; \
  51826   poly64x2x3_t __s1 = __p1; \
  51827   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 38); \
  51828   __ret; \
  51829 })
  51830 #else
  51831 #define vld3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  51832   poly64x2x3_t __ret; \
  51833   poly64x2x3_t __s1 = __p1; \
  51834   poly64x2x3_t __rev1; \
  51835   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51836   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51837   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  51838   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 38); \
  51839  \
  51840   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51841   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51842   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51843   __ret; \
  51844 })
  51845 #endif
  51846 
  /* vld3q_lane_u8(__p0, __p1, __p2): statement-expression macro evaluating to
   * a uint8x16x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 48).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 48 the type code. */
  51847 #ifdef __LITTLE_ENDIAN__
  51848 #define vld3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  51849   uint8x16x3_t __ret; \
  51850   uint8x16x3_t __s1 = __p1; \
  51851   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 48); \
  51852   __ret; \
  51853 })
  51854 #else
  51855 #define vld3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  51856   uint8x16x3_t __ret; \
  51857   uint8x16x3_t __s1 = __p1; \
  51858   uint8x16x3_t __rev1; \
  51859   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51860   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51861   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51862   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 48); \
  51863  \
  51864   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51865   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51866   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51867   __ret; \
  51868 })
  51869 #endif
  51870 
  /* vld3q_lane_u64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a uint64x2x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 51).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 51 the type code. */
  51871 #ifdef __LITTLE_ENDIAN__
  51872 #define vld3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51873   uint64x2x3_t __ret; \
  51874   uint64x2x3_t __s1 = __p1; \
  51875   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 51); \
  51876   __ret; \
  51877 })
  51878 #else
  51879 #define vld3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51880   uint64x2x3_t __ret; \
  51881   uint64x2x3_t __s1 = __p1; \
  51882   uint64x2x3_t __rev1; \
  51883   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51884   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51885   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  51886   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 51); \
  51887  \
  51888   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51889   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51890   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51891   __ret; \
  51892 })
  51893 #endif
  51894 
  /* vld3q_lane_s8(__p0, __p1, __p2): statement-expression macro evaluating to
   * an int8x16x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 32).
   * The #else (non-__LITTLE_ENDIAN__) definition first reverses the 16 lanes
   * of each input into __rev1 and reverses each result vector afterwards.
   * NOTE(review): __p2 is presumably the lane index, 32 the type code. */
  51895 #ifdef __LITTLE_ENDIAN__
  51896 #define vld3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  51897   int8x16x3_t __ret; \
  51898   int8x16x3_t __s1 = __p1; \
  51899   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 32); \
  51900   __ret; \
  51901 })
  51902 #else
  51903 #define vld3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  51904   int8x16x3_t __ret; \
  51905   int8x16x3_t __s1 = __p1; \
  51906   int8x16x3_t __rev1; \
  51907   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51908   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51909   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51910   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 32); \
  51911  \
  51912   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51913   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51914   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  51915   __ret; \
  51916 })
  51917 #endif
  51918 
  /* vld3q_lane_f64(__p0, __p1, __p2): statement-expression macro evaluating
   * to a float64x2x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 42).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 42 the type code. */
  51919 #ifdef __LITTLE_ENDIAN__
  51920 #define vld3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51921   float64x2x3_t __ret; \
  51922   float64x2x3_t __s1 = __p1; \
  51923   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 42); \
  51924   __ret; \
  51925 })
  51926 #else
  51927 #define vld3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51928   float64x2x3_t __ret; \
  51929   float64x2x3_t __s1 = __p1; \
  51930   float64x2x3_t __rev1; \
  51931   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51932   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51933   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  51934   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 42); \
  51935  \
  51936   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51937   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51938   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51939   __ret; \
  51940 })
  51941 #endif
  51942 
  /* vld3q_lane_s64(__p0, __p1, __p2): statement-expression macro evaluating
   * to an int64x2x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast
   * to int8x16_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3q_lane_v(&__ret, ..., 35).
   * The #else (non-__LITTLE_ENDIAN__) definition first swaps the two lanes of
   * each input into __rev1 and swaps each result vector's lanes afterwards.
   * NOTE(review): __p2 is presumably the lane index, 35 the type code. */
  51943 #ifdef __LITTLE_ENDIAN__
  51944 #define vld3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51945   int64x2x3_t __ret; \
  51946   int64x2x3_t __s1 = __p1; \
  51947   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 35); \
  51948   __ret; \
  51949 })
  51950 #else
  51951 #define vld3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51952   int64x2x3_t __ret; \
  51953   int64x2x3_t __s1 = __p1; \
  51954   int64x2x3_t __rev1; \
  51955   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  51956   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  51957   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  51958   __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 35); \
  51959  \
  51960   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  51961   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  51962   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  51963   __ret; \
  51964 })
  51965 #endif
  51966 
  /* vld3_lane_u64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a uint64x1x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3_lane_v(&__ret, ..., 19).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 19 the type code. */
  51967 #define vld3_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  51968   uint64x1x3_t __ret; \
  51969   uint64x1x3_t __s1 = __p1; \
  51970   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 19); \
  51971   __ret; \
  51972 })
  /* vld3_lane_f64(__p0, __p1, __p2): statement-expression macro evaluating to
   * a float64x1x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3_lane_v(&__ret, ..., 10).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 10 the type code. */
  51973 #define vld3_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  51974   float64x1x3_t __ret; \
  51975   float64x1x3_t __s1 = __p1; \
  51976   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 10); \
  51977   __ret; \
  51978 })
  /* vld3_lane_s64(__p0, __p1, __p2): statement-expression macro evaluating to
   * an int64x1x3_t.  __p1 is copied to __s1; its 3 val[] vectors are cast to
   * int8x8_t and passed with __p0 and __p2 to
   * __builtin_neon_vld3_lane_v(&__ret, ..., 3).
   * No endian-specific variant is defined in this block.
   * NOTE(review): __p2 is presumably the lane index, 3 the type code. */
  51979 #define vld3_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  51980   int64x1x3_t __ret; \
  51981   int64x1x3_t __s1 = __p1; \
  51982   __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 3); \
  51983   __ret; \
  51984 })
  /* vld4_p64(__p0): statement-expression macro that declares a poly64x1x4_t
   * __ret, has __builtin_neon_vld4_v(&__ret, __p0, 6) fill it, and evaluates
   * to __ret.  No endian-specific variant is defined in this block.
   * NOTE(review): 6 is presumably the builtin's vector-type code -- confirm. */
  51985 #define vld4_p64(__p0) __extension__ ({ \
  51986   poly64x1x4_t __ret; \
  51987   __builtin_neon_vld4_v(&__ret, __p0, 6); \
  51988   __ret; \
  51989 })
  /* vld4q_p64(__p0): statement-expression macro that declares a poly64x2x4_t
   * __ret, has __builtin_neon_vld4q_v(&__ret, __p0, 38) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 4 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 38 is presumably the builtin's vector-type code -- confirm. */
  51990 #ifdef __LITTLE_ENDIAN__
  51991 #define vld4q_p64(__p0) __extension__ ({ \
  51992   poly64x2x4_t __ret; \
  51993   __builtin_neon_vld4q_v(&__ret, __p0, 38); \
  51994   __ret; \
  51995 })
  51996 #else
  51997 #define vld4q_p64(__p0) __extension__ ({ \
  51998   poly64x2x4_t __ret; \
  51999   __builtin_neon_vld4q_v(&__ret, __p0, 38); \
  52000  \
  52001   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  52002   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  52003   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  52004   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  52005   __ret; \
  52006 })
  52007 #endif
  52008 
  /* vld4q_u64(__p0): statement-expression macro that declares a uint64x2x4_t
   * __ret, has __builtin_neon_vld4q_v(&__ret, __p0, 51) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 4 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 51 is presumably the builtin's vector-type code -- confirm. */
  52009 #ifdef __LITTLE_ENDIAN__
  52010 #define vld4q_u64(__p0) __extension__ ({ \
  52011   uint64x2x4_t __ret; \
  52012   __builtin_neon_vld4q_v(&__ret, __p0, 51); \
  52013   __ret; \
  52014 })
  52015 #else
  52016 #define vld4q_u64(__p0) __extension__ ({ \
  52017   uint64x2x4_t __ret; \
  52018   __builtin_neon_vld4q_v(&__ret, __p0, 51); \
  52019  \
  52020   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  52021   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  52022   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  52023   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  52024   __ret; \
  52025 })
  52026 #endif
  52027 
  /* vld4q_f64(__p0): statement-expression macro that declares a float64x2x4_t
   * __ret, has __builtin_neon_vld4q_v(&__ret, __p0, 42) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 4 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 42 is presumably the builtin's vector-type code -- confirm. */
  52028 #ifdef __LITTLE_ENDIAN__
  52029 #define vld4q_f64(__p0) __extension__ ({ \
  52030   float64x2x4_t __ret; \
  52031   __builtin_neon_vld4q_v(&__ret, __p0, 42); \
  52032   __ret; \
  52033 })
  52034 #else
  52035 #define vld4q_f64(__p0) __extension__ ({ \
  52036   float64x2x4_t __ret; \
  52037   __builtin_neon_vld4q_v(&__ret, __p0, 42); \
  52038  \
  52039   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  52040   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  52041   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  52042   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  52043   __ret; \
  52044 })
  52045 #endif
  52046 
  /* vld4q_s64(__p0): statement-expression macro that declares an int64x2x4_t
   * __ret, has __builtin_neon_vld4q_v(&__ret, __p0, 35) fill it, and evaluates
   * to __ret.
   * The #else (non-__LITTLE_ENDIAN__) definition also swaps the two lanes of
   * each of the 4 val[] vectors via __builtin_shufflevector(v, v, 1, 0).
   * NOTE(review): 35 is presumably the builtin's vector-type code -- confirm. */
  52047 #ifdef __LITTLE_ENDIAN__
  52048 #define vld4q_s64(__p0) __extension__ ({ \
  52049   int64x2x4_t __ret; \
  52050   __builtin_neon_vld4q_v(&__ret, __p0, 35); \
  52051   __ret; \
  52052 })
  52053 #else
  52054 #define vld4q_s64(__p0) __extension__ ({ \
  52055   int64x2x4_t __ret; \
  52056   __builtin_neon_vld4q_v(&__ret, __p0, 35); \
  52057  \
  52058   __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  52059   __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  52060   __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  52061   __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  52062   __ret; \
  52063 })
  52064 #endif
  52065 
  /* vld4_f64(__p0): statement-expression macro that fills a float64x1x4_t via
   * __builtin_neon_vld4_v(&result, __p0, 10) and evaluates to that struct.
   * The same definition is used regardless of __LITTLE_ENDIAN__. */
  #define vld4_f64(__p0) __extension__ ({ \
    float64x1x4_t __quad; \
    __builtin_neon_vld4_v(&__quad, __p0, 10); \
    __quad; \
  })
  /* vld4_dup_p64(__p0): statement-expression macro that fills a poly64x1x4_t
   * via __builtin_neon_vld4_dup_v(&result, __p0, 6) and evaluates to that
   * struct.  The same definition is used regardless of __LITTLE_ENDIAN__. */
  #define vld4_dup_p64(__p0) __extension__ ({ \
    poly64x1x4_t __quad; \
    __builtin_neon_vld4_dup_v(&__quad, __p0, 6); \
    __quad; \
  })
  /* vld4q_dup_p64(__p0): statement-expression macro that fills a poly64x2x4_t
   * via __builtin_neon_vld4q_dup_v(&result, __p0, 38) and evaluates to that
   * struct.  When __LITTLE_ENDIAN__ is not defined, the two lanes of each of
   * the four val[] vectors are swapped after the builtin returns. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_dup_p64(__p0) __extension__ ({ \
    poly64x2x4_t __quad; \
    __builtin_neon_vld4q_dup_v(&__quad, __p0, 38); \
    __quad; \
  })
  #else
  #define vld4q_dup_p64(__p0) __extension__ ({ \
    poly64x2x4_t __quad; \
    __builtin_neon_vld4q_dup_v(&__quad, __p0, 38); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52094 
  /* vld4q_dup_f64(__p0): statement-expression macro that fills a float64x2x4_t
   * via __builtin_neon_vld4q_dup_v(&result, __p0, 42) and evaluates to that
   * struct.  When __LITTLE_ENDIAN__ is not defined, the two lanes of each of
   * the four val[] vectors are swapped after the builtin returns. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_dup_f64(__p0) __extension__ ({ \
    float64x2x4_t __quad; \
    __builtin_neon_vld4q_dup_v(&__quad, __p0, 42); \
    __quad; \
  })
  #else
  #define vld4q_dup_f64(__p0) __extension__ ({ \
    float64x2x4_t __quad; \
    __builtin_neon_vld4q_dup_v(&__quad, __p0, 42); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52113 
  /* vld4_dup_f64(__p0): statement-expression macro that fills a float64x1x4_t
   * via __builtin_neon_vld4_dup_v(&result, __p0, 10) and evaluates to that
   * struct.  The same definition is used regardless of __LITTLE_ENDIAN__. */
  #define vld4_dup_f64(__p0) __extension__ ({ \
    float64x1x4_t __quad; \
    __builtin_neon_vld4_dup_v(&__quad, __p0, 10); \
    __quad; \
  })
  /* vld4_lane_p64(__p0, __p1, __p2): copies __p1 into a local poly64x1x4_t,
   * passes its four val[] vectors (cast to int8x8_t) together with __p0 and
   * __p2 to __builtin_neon_vld4_lane_v (type code 6), and evaluates to the
   * poly64x1x4_t the builtin wrote.  No endian-specific variant exists. */
  #define vld4_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x1x4_t __quad; \
    poly64x1x4_t __src = __p1; \
    __builtin_neon_vld4_lane_v(&__quad, __p0, \
        (int8x8_t)__src.val[0], (int8x8_t)__src.val[1], \
        (int8x8_t)__src.val[2], (int8x8_t)__src.val[3], __p2, 6); \
    __quad; \
  })
  /* vld4q_lane_p8(__p0, __p1, __p2): copies __p1 into a local poly8x16x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 36), and evaluates to the
   * poly8x16x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the 16 lanes of every input vector are reversed before the call and the
   * 16 lanes of every output vector are reversed after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x4_t __quad; \
    poly8x16x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 36); \
    __quad; \
  })
  #else
  #define vld4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x4_t __quad; \
    poly8x16x4_t __src = __p1; \
    poly8x16x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 36); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad; \
  })
  #endif
  52150 
  /* vld4q_lane_p64(__p0, __p1, __p2): copies __p1 into a local poly64x2x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 38), and evaluates to the
   * poly64x2x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the two lanes of every input vector are swapped before the call and the
   * two lanes of every output vector are swapped after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2x4_t __quad; \
    poly64x2x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 38); \
    __quad; \
  })
  #else
  #define vld4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2x4_t __quad; \
    poly64x2x4_t __src = __p1; \
    poly64x2x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 38); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52176 
  /* vld4q_lane_u8(__p0, __p1, __p2): copies __p1 into a local uint8x16x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 48), and evaluates to the
   * uint8x16x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the 16 lanes of every input vector are reversed before the call and the
   * 16 lanes of every output vector are reversed after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16x4_t __quad; \
    uint8x16x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 48); \
    __quad; \
  })
  #else
  #define vld4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16x4_t __quad; \
    uint8x16x4_t __src = __p1; \
    uint8x16x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 48); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad; \
  })
  #endif
  52202 
  /* vld4q_lane_u64(__p0, __p1, __p2): copies __p1 into a local uint64x2x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 51), and evaluates to the
   * uint64x2x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the two lanes of every input vector are swapped before the call and the
   * two lanes of every output vector are swapped after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2x4_t __quad; \
    uint64x2x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 51); \
    __quad; \
  })
  #else
  #define vld4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2x4_t __quad; \
    uint64x2x4_t __src = __p1; \
    uint64x2x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 51); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52228 
  /* vld4q_lane_s8(__p0, __p1, __p2): copies __p1 into a local int8x16x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 32), and evaluates to the
   * int8x16x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the 16 lanes of every input vector are reversed before the call and the
   * 16 lanes of every output vector are reversed after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16x4_t __quad; \
    int8x16x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 32); \
    __quad; \
  })
  #else
  #define vld4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16x4_t __quad; \
    int8x16x4_t __src = __p1; \
    int8x16x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 32); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __quad; \
  })
  #endif
  52254 
  /* vld4q_lane_f64(__p0, __p1, __p2): copies __p1 into a local float64x2x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 42), and evaluates to the
   * float64x2x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the two lanes of every input vector are swapped before the call and the
   * two lanes of every output vector are swapped after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2x4_t __quad; \
    float64x2x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 42); \
    __quad; \
  })
  #else
  #define vld4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2x4_t __quad; \
    float64x2x4_t __src = __p1; \
    float64x2x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 42); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52280 
  /* vld4q_lane_s64(__p0, __p1, __p2): copies __p1 into a local int64x2x4_t,
   * passes its four val[] vectors (cast to int8x16_t) together with __p0 and
   * __p2 to __builtin_neon_vld4q_lane_v (type code 35), and evaluates to the
   * int64x2x4_t the builtin wrote.  When __LITTLE_ENDIAN__ is not defined,
   * the two lanes of every input vector are swapped before the call and the
   * two lanes of every output vector are swapped after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vld4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2x4_t __quad; \
    int64x2x4_t __src = __p1; \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__src.val[0], (int8x16_t)__src.val[1], \
        (int8x16_t)__src.val[2], (int8x16_t)__src.val[3], __p2, 35); \
    __quad; \
  })
  #else
  #define vld4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2x4_t __quad; \
    int64x2x4_t __src = __p1; \
    int64x2x4_t __flipped; \
    __flipped.val[0] = __builtin_shufflevector(__src.val[0], __src.val[0], 1, 0); \
    __flipped.val[1] = __builtin_shufflevector(__src.val[1], __src.val[1], 1, 0); \
    __flipped.val[2] = __builtin_shufflevector(__src.val[2], __src.val[2], 1, 0); \
    __flipped.val[3] = __builtin_shufflevector(__src.val[3], __src.val[3], 1, 0); \
    __builtin_neon_vld4q_lane_v(&__quad, __p0, \
        (int8x16_t)__flipped.val[0], (int8x16_t)__flipped.val[1], \
        (int8x16_t)__flipped.val[2], (int8x16_t)__flipped.val[3], __p2, 35); \
    __quad.val[0] = __builtin_shufflevector(__quad.val[0], __quad.val[0], 1, 0); \
    __quad.val[1] = __builtin_shufflevector(__quad.val[1], __quad.val[1], 1, 0); \
    __quad.val[2] = __builtin_shufflevector(__quad.val[2], __quad.val[2], 1, 0); \
    __quad.val[3] = __builtin_shufflevector(__quad.val[3], __quad.val[3], 1, 0); \
    __quad; \
  })
  #endif
  52306 
  /* vld4_lane_u64(__p0, __p1, __p2): copies __p1 into a local uint64x1x4_t,
   * passes its four val[] vectors (cast to int8x8_t) together with __p0 and
   * __p2 to __builtin_neon_vld4_lane_v (type code 19), and evaluates to the
   * uint64x1x4_t the builtin wrote.  No endian-specific variant exists. */
  #define vld4_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x1x4_t __quad; \
    uint64x1x4_t __src = __p1; \
    __builtin_neon_vld4_lane_v(&__quad, __p0, \
        (int8x8_t)__src.val[0], (int8x8_t)__src.val[1], \
        (int8x8_t)__src.val[2], (int8x8_t)__src.val[3], __p2, 19); \
    __quad; \
  })
  /* vld4_lane_f64(__p0, __p1, __p2): copies __p1 into a local float64x1x4_t,
   * passes its four val[] vectors (cast to int8x8_t) together with __p0 and
   * __p2 to __builtin_neon_vld4_lane_v (type code 10), and evaluates to the
   * float64x1x4_t the builtin wrote.  No endian-specific variant exists. */
  #define vld4_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x1x4_t __quad; \
    float64x1x4_t __src = __p1; \
    __builtin_neon_vld4_lane_v(&__quad, __p0, \
        (int8x8_t)__src.val[0], (int8x8_t)__src.val[1], \
        (int8x8_t)__src.val[2], (int8x8_t)__src.val[3], __p2, 10); \
    __quad; \
  })
  /* vld4_lane_s64(__p0, __p1, __p2): copies __p1 into a local int64x1x4_t,
   * passes its four val[] vectors (cast to int8x8_t) together with __p0 and
   * __p2 to __builtin_neon_vld4_lane_v (type code 3), and evaluates to the
   * int64x1x4_t the builtin wrote.  No endian-specific variant exists. */
  #define vld4_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x1x4_t __quad; \
    int64x1x4_t __src = __p1; \
    __builtin_neon_vld4_lane_v(&__quad, __p0, \
        (int8x8_t)__src.val[0], (int8x8_t)__src.val[1], \
        (int8x8_t)__src.val[2], (int8x8_t)__src.val[3], __p2, 3); \
    __quad; \
  })
  /* vldrq_p128(__p0): statement-expression macro that evaluates to the result
   * of __builtin_neon_vldrq_p128(__p0), cast to poly128_t. */
  #define vldrq_p128(__p0) __extension__ ({ \
    poly128_t __loaded = (poly128_t) __builtin_neon_vldrq_p128(__p0); \
    __loaded; \
  })
  52330 #ifdef __LITTLE_ENDIAN__
  52331 __ai __attribute__((target("neon"))) float64x2_t vmaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  52332   float64x2_t __ret;
  52333   __ret = (float64x2_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  52334   return __ret;
  52335 }
  52336 #else
  52337 __ai __attribute__((target("neon"))) float64x2_t vmaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  52338   float64x2_t __ret;
  52339   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52340   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  52341   __ret = (float64x2_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  52342   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  52343   return __ret;
  52344 }
  52345 #endif
  52346 
  52347 __ai __attribute__((target("neon"))) float64x1_t vmax_f64(float64x1_t __p0, float64x1_t __p1) {
  52348   float64x1_t __ret;
  52349   __ret = (float64x1_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  52350   return __ret;
  52351 }
  52352 #ifdef __LITTLE_ENDIAN__
  52353 __ai __attribute__((target("neon"))) float64_t vmaxnmvq_f64(float64x2_t __p0) {
  52354   float64_t __ret;
  52355   __ret = (float64_t) __builtin_neon_vmaxnmvq_f64(__p0);
  52356   return __ret;
  52357 }
  52358 #else
  52359 __ai __attribute__((target("neon"))) float64_t vmaxnmvq_f64(float64x2_t __p0) {
  52360   float64_t __ret;
  52361   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52362   __ret = (float64_t) __builtin_neon_vmaxnmvq_f64(__rev0);
  52363   return __ret;
  52364 }
  52365 #endif
  52366 
  52367 #ifdef __LITTLE_ENDIAN__
  52368 __ai __attribute__((target("neon"))) float32_t vmaxnmvq_f32(float32x4_t __p0) {
  52369   float32_t __ret;
  52370   __ret = (float32_t) __builtin_neon_vmaxnmvq_f32(__p0);
  52371   return __ret;
  52372 }
  52373 #else
  52374 __ai __attribute__((target("neon"))) float32_t vmaxnmvq_f32(float32x4_t __p0) {
  52375   float32_t __ret;
  52376   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52377   __ret = (float32_t) __builtin_neon_vmaxnmvq_f32(__rev0);
  52378   return __ret;
  52379 }
  52380 #endif
  52381 
  52382 #ifdef __LITTLE_ENDIAN__
  52383 __ai __attribute__((target("neon"))) float32_t vmaxnmv_f32(float32x2_t __p0) {
  52384   float32_t __ret;
  52385   __ret = (float32_t) __builtin_neon_vmaxnmv_f32(__p0);
  52386   return __ret;
  52387 }
  52388 #else
  52389 __ai __attribute__((target("neon"))) float32_t vmaxnmv_f32(float32x2_t __p0) {
  52390   float32_t __ret;
  52391   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52392   __ret = (float32_t) __builtin_neon_vmaxnmv_f32(__rev0);
  52393   return __ret;
  52394 }
  52395 #endif
  52396 
  52397 #ifdef __LITTLE_ENDIAN__
  52398 __ai __attribute__((target("neon"))) uint8_t vmaxvq_u8(uint8x16_t __p0) {
  52399   uint8_t __ret;
  52400   __ret = (uint8_t) __builtin_neon_vmaxvq_u8(__p0);
  52401   return __ret;
  52402 }
  52403 #else
  52404 __ai __attribute__((target("neon"))) uint8_t vmaxvq_u8(uint8x16_t __p0) {
  52405   uint8_t __ret;
  52406   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  52407   __ret = (uint8_t) __builtin_neon_vmaxvq_u8(__rev0);
  52408   return __ret;
  52409 }
  52410 #endif
  52411 
  52412 #ifdef __LITTLE_ENDIAN__
  52413 __ai __attribute__((target("neon"))) uint32_t vmaxvq_u32(uint32x4_t __p0) {
  52414   uint32_t __ret;
  52415   __ret = (uint32_t) __builtin_neon_vmaxvq_u32(__p0);
  52416   return __ret;
  52417 }
  52418 #else
  52419 __ai __attribute__((target("neon"))) uint32_t vmaxvq_u32(uint32x4_t __p0) {
  52420   uint32_t __ret;
  52421   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52422   __ret = (uint32_t) __builtin_neon_vmaxvq_u32(__rev0);
  52423   return __ret;
  52424 }
  52425 #endif
  52426 
  52427 #ifdef __LITTLE_ENDIAN__
  52428 __ai __attribute__((target("neon"))) uint16_t vmaxvq_u16(uint16x8_t __p0) {
  52429   uint16_t __ret;
  52430   __ret = (uint16_t) __builtin_neon_vmaxvq_u16(__p0);
  52431   return __ret;
  52432 }
  52433 #else
  52434 __ai __attribute__((target("neon"))) uint16_t vmaxvq_u16(uint16x8_t __p0) {
  52435   uint16_t __ret;
  52436   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52437   __ret = (uint16_t) __builtin_neon_vmaxvq_u16(__rev0);
  52438   return __ret;
  52439 }
  52440 #endif
  52441 
  52442 #ifdef __LITTLE_ENDIAN__
  52443 __ai __attribute__((target("neon"))) int8_t vmaxvq_s8(int8x16_t __p0) {
  52444   int8_t __ret;
  52445   __ret = (int8_t) __builtin_neon_vmaxvq_s8(__p0);
  52446   return __ret;
  52447 }
  52448 #else
  52449 __ai __attribute__((target("neon"))) int8_t vmaxvq_s8(int8x16_t __p0) {
  52450   int8_t __ret;
  52451   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  52452   __ret = (int8_t) __builtin_neon_vmaxvq_s8(__rev0);
  52453   return __ret;
  52454 }
  52455 #endif
  52456 
  52457 #ifdef __LITTLE_ENDIAN__
  52458 __ai __attribute__((target("neon"))) float64_t vmaxvq_f64(float64x2_t __p0) {
  52459   float64_t __ret;
  52460   __ret = (float64_t) __builtin_neon_vmaxvq_f64(__p0);
  52461   return __ret;
  52462 }
  52463 #else
  52464 __ai __attribute__((target("neon"))) float64_t vmaxvq_f64(float64x2_t __p0) {
  52465   float64_t __ret;
  52466   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52467   __ret = (float64_t) __builtin_neon_vmaxvq_f64(__rev0);
  52468   return __ret;
  52469 }
  52470 #endif
  52471 
  52472 #ifdef __LITTLE_ENDIAN__
  52473 __ai __attribute__((target("neon"))) float32_t vmaxvq_f32(float32x4_t __p0) {
  52474   float32_t __ret;
  52475   __ret = (float32_t) __builtin_neon_vmaxvq_f32(__p0);
  52476   return __ret;
  52477 }
  52478 #else
  52479 __ai __attribute__((target("neon"))) float32_t vmaxvq_f32(float32x4_t __p0) {
  52480   float32_t __ret;
  52481   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52482   __ret = (float32_t) __builtin_neon_vmaxvq_f32(__rev0);
  52483   return __ret;
  52484 }
  52485 #endif
  52486 
  52487 #ifdef __LITTLE_ENDIAN__
  52488 __ai __attribute__((target("neon"))) int32_t vmaxvq_s32(int32x4_t __p0) {
  52489   int32_t __ret;
  52490   __ret = (int32_t) __builtin_neon_vmaxvq_s32(__p0);
  52491   return __ret;
  52492 }
  52493 #else
  52494 __ai __attribute__((target("neon"))) int32_t vmaxvq_s32(int32x4_t __p0) {
  52495   int32_t __ret;
  52496   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52497   __ret = (int32_t) __builtin_neon_vmaxvq_s32(__rev0);
  52498   return __ret;
  52499 }
  52500 #endif
  52501 
  52502 #ifdef __LITTLE_ENDIAN__
  52503 __ai __attribute__((target("neon"))) int16_t vmaxvq_s16(int16x8_t __p0) {
  52504   int16_t __ret;
  52505   __ret = (int16_t) __builtin_neon_vmaxvq_s16(__p0);
  52506   return __ret;
  52507 }
  52508 #else
  52509 __ai __attribute__((target("neon"))) int16_t vmaxvq_s16(int16x8_t __p0) {
  52510   int16_t __ret;
  52511   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52512   __ret = (int16_t) __builtin_neon_vmaxvq_s16(__rev0);
  52513   return __ret;
  52514 }
  52515 #endif
  52516 
  52517 #ifdef __LITTLE_ENDIAN__
  52518 __ai __attribute__((target("neon"))) uint8_t vmaxv_u8(uint8x8_t __p0) {
  52519   uint8_t __ret;
  52520   __ret = (uint8_t) __builtin_neon_vmaxv_u8(__p0);
  52521   return __ret;
  52522 }
  52523 #else
  52524 __ai __attribute__((target("neon"))) uint8_t vmaxv_u8(uint8x8_t __p0) {
  52525   uint8_t __ret;
  52526   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52527   __ret = (uint8_t) __builtin_neon_vmaxv_u8(__rev0);
  52528   return __ret;
  52529 }
  52530 #endif
  52531 
  52532 #ifdef __LITTLE_ENDIAN__
  52533 __ai __attribute__((target("neon"))) uint32_t vmaxv_u32(uint32x2_t __p0) {
  52534   uint32_t __ret;
  52535   __ret = (uint32_t) __builtin_neon_vmaxv_u32(__p0);
  52536   return __ret;
  52537 }
  52538 #else
  52539 __ai __attribute__((target("neon"))) uint32_t vmaxv_u32(uint32x2_t __p0) {
  52540   uint32_t __ret;
  52541   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52542   __ret = (uint32_t) __builtin_neon_vmaxv_u32(__rev0);
  52543   return __ret;
  52544 }
  52545 #endif
  52546 
  52547 #ifdef __LITTLE_ENDIAN__
  52548 __ai __attribute__((target("neon"))) uint16_t vmaxv_u16(uint16x4_t __p0) {
  52549   uint16_t __ret;
  52550   __ret = (uint16_t) __builtin_neon_vmaxv_u16(__p0);
  52551   return __ret;
  52552 }
  52553 #else
  52554 __ai __attribute__((target("neon"))) uint16_t vmaxv_u16(uint16x4_t __p0) {
  52555   uint16_t __ret;
  52556   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52557   __ret = (uint16_t) __builtin_neon_vmaxv_u16(__rev0);
  52558   return __ret;
  52559 }
  52560 #endif
  52561 
  52562 #ifdef __LITTLE_ENDIAN__
  52563 __ai __attribute__((target("neon"))) int8_t vmaxv_s8(int8x8_t __p0) {
  52564   int8_t __ret;
  52565   __ret = (int8_t) __builtin_neon_vmaxv_s8(__p0);
  52566   return __ret;
  52567 }
  52568 #else
  52569 __ai __attribute__((target("neon"))) int8_t vmaxv_s8(int8x8_t __p0) {
  52570   int8_t __ret;
  52571   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52572   __ret = (int8_t) __builtin_neon_vmaxv_s8(__rev0);
  52573   return __ret;
  52574 }
  52575 #endif
  52576 
  52577 #ifdef __LITTLE_ENDIAN__
  52578 __ai __attribute__((target("neon"))) float32_t vmaxv_f32(float32x2_t __p0) {
  52579   float32_t __ret;
  52580   __ret = (float32_t) __builtin_neon_vmaxv_f32(__p0);
  52581   return __ret;
  52582 }
  52583 #else
  52584 __ai __attribute__((target("neon"))) float32_t vmaxv_f32(float32x2_t __p0) {
  52585   float32_t __ret;
  52586   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52587   __ret = (float32_t) __builtin_neon_vmaxv_f32(__rev0);
  52588   return __ret;
  52589 }
  52590 #endif
  52591 
  52592 #ifdef __LITTLE_ENDIAN__
  52593 __ai __attribute__((target("neon"))) int32_t vmaxv_s32(int32x2_t __p0) {
  52594   int32_t __ret;
  52595   __ret = (int32_t) __builtin_neon_vmaxv_s32(__p0);
  52596   return __ret;
  52597 }
  52598 #else
  52599 __ai __attribute__((target("neon"))) int32_t vmaxv_s32(int32x2_t __p0) {
  52600   int32_t __ret;
  52601   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52602   __ret = (int32_t) __builtin_neon_vmaxv_s32(__rev0);
  52603   return __ret;
  52604 }
  52605 #endif
  52606 
  52607 #ifdef __LITTLE_ENDIAN__
  52608 __ai __attribute__((target("neon"))) int16_t vmaxv_s16(int16x4_t __p0) {
  52609   int16_t __ret;
  52610   __ret = (int16_t) __builtin_neon_vmaxv_s16(__p0);
  52611   return __ret;
  52612 }
  52613 #else
  52614 __ai __attribute__((target("neon"))) int16_t vmaxv_s16(int16x4_t __p0) {
  52615   int16_t __ret;
  52616   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52617   __ret = (int16_t) __builtin_neon_vmaxv_s16(__rev0);
  52618   return __ret;
  52619 }
  52620 #endif
  52621 
  52622 #ifdef __LITTLE_ENDIAN__
  52623 __ai __attribute__((target("neon"))) float64x2_t vminq_f64(float64x2_t __p0, float64x2_t __p1) {
  52624   float64x2_t __ret;
  52625   __ret = (float64x2_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  52626   return __ret;
  52627 }
  52628 #else
  52629 __ai __attribute__((target("neon"))) float64x2_t vminq_f64(float64x2_t __p0, float64x2_t __p1) {
  52630   float64x2_t __ret;
  52631   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52632   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  52633   __ret = (float64x2_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  52634   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  52635   return __ret;
  52636 }
  52637 #endif
  52638 
  52639 __ai __attribute__((target("neon"))) float64x1_t vmin_f64(float64x1_t __p0, float64x1_t __p1) {
  52640   float64x1_t __ret;
  52641   __ret = (float64x1_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  52642   return __ret;
  52643 }
  52644 #ifdef __LITTLE_ENDIAN__
  52645 __ai __attribute__((target("neon"))) float64_t vminnmvq_f64(float64x2_t __p0) {
  52646   float64_t __ret;
  52647   __ret = (float64_t) __builtin_neon_vminnmvq_f64(__p0);
  52648   return __ret;
  52649 }
  52650 #else
  52651 __ai __attribute__((target("neon"))) float64_t vminnmvq_f64(float64x2_t __p0) {
  52652   float64_t __ret;
  52653   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52654   __ret = (float64_t) __builtin_neon_vminnmvq_f64(__rev0);
  52655   return __ret;
  52656 }
  52657 #endif
  52658 
  52659 #ifdef __LITTLE_ENDIAN__
  52660 __ai __attribute__((target("neon"))) float32_t vminnmvq_f32(float32x4_t __p0) {
  52661   float32_t __ret;
  52662   __ret = (float32_t) __builtin_neon_vminnmvq_f32(__p0);
  52663   return __ret;
  52664 }
  52665 #else
  52666 __ai __attribute__((target("neon"))) float32_t vminnmvq_f32(float32x4_t __p0) {
  52667   float32_t __ret;
  52668   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52669   __ret = (float32_t) __builtin_neon_vminnmvq_f32(__rev0);
  52670   return __ret;
  52671 }
  52672 #endif
  52673 
  52674 #ifdef __LITTLE_ENDIAN__
  52675 __ai __attribute__((target("neon"))) float32_t vminnmv_f32(float32x2_t __p0) {
  52676   float32_t __ret;
  52677   __ret = (float32_t) __builtin_neon_vminnmv_f32(__p0);
  52678   return __ret;
  52679 }
  52680 #else
  52681 __ai __attribute__((target("neon"))) float32_t vminnmv_f32(float32x2_t __p0) {
  52682   float32_t __ret;
  52683   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52684   __ret = (float32_t) __builtin_neon_vminnmv_f32(__rev0);
  52685   return __ret;
  52686 }
  52687 #endif
  52688 
  52689 #ifdef __LITTLE_ENDIAN__
  52690 __ai __attribute__((target("neon"))) uint8_t vminvq_u8(uint8x16_t __p0) {
  52691   uint8_t __ret;
  52692   __ret = (uint8_t) __builtin_neon_vminvq_u8(__p0);
  52693   return __ret;
  52694 }
  52695 #else
  52696 __ai __attribute__((target("neon"))) uint8_t vminvq_u8(uint8x16_t __p0) {
  52697   uint8_t __ret;
  52698   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  52699   __ret = (uint8_t) __builtin_neon_vminvq_u8(__rev0);
  52700   return __ret;
  52701 }
  52702 #endif
  52703 
  52704 #ifdef __LITTLE_ENDIAN__
  52705 __ai __attribute__((target("neon"))) uint32_t vminvq_u32(uint32x4_t __p0) {
  52706   uint32_t __ret;
  52707   __ret = (uint32_t) __builtin_neon_vminvq_u32(__p0);
  52708   return __ret;
  52709 }
  52710 #else
  52711 __ai __attribute__((target("neon"))) uint32_t vminvq_u32(uint32x4_t __p0) {
  52712   uint32_t __ret;
  52713   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52714   __ret = (uint32_t) __builtin_neon_vminvq_u32(__rev0);
  52715   return __ret;
  52716 }
  52717 #endif
  52718 
  52719 #ifdef __LITTLE_ENDIAN__
  52720 __ai __attribute__((target("neon"))) uint16_t vminvq_u16(uint16x8_t __p0) {
  52721   uint16_t __ret;
  52722   __ret = (uint16_t) __builtin_neon_vminvq_u16(__p0);
  52723   return __ret;
  52724 }
  52725 #else
  52726 __ai __attribute__((target("neon"))) uint16_t vminvq_u16(uint16x8_t __p0) {
  52727   uint16_t __ret;
  52728   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52729   __ret = (uint16_t) __builtin_neon_vminvq_u16(__rev0);
  52730   return __ret;
  52731 }
  52732 #endif
  52733 
  52734 #ifdef __LITTLE_ENDIAN__
  52735 __ai __attribute__((target("neon"))) int8_t vminvq_s8(int8x16_t __p0) {
  52736   int8_t __ret;
  52737   __ret = (int8_t) __builtin_neon_vminvq_s8(__p0);
  52738   return __ret;
  52739 }
  52740 #else
  52741 __ai __attribute__((target("neon"))) int8_t vminvq_s8(int8x16_t __p0) {
  52742   int8_t __ret;
  52743   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  52744   __ret = (int8_t) __builtin_neon_vminvq_s8(__rev0);
  52745   return __ret;
  52746 }
  52747 #endif
  52748 
  52749 #ifdef __LITTLE_ENDIAN__
  52750 __ai __attribute__((target("neon"))) float64_t vminvq_f64(float64x2_t __p0) {
  52751   float64_t __ret;
  52752   __ret = (float64_t) __builtin_neon_vminvq_f64(__p0);
  52753   return __ret;
  52754 }
  52755 #else
  52756 __ai __attribute__((target("neon"))) float64_t vminvq_f64(float64x2_t __p0) {
  52757   float64_t __ret;
  52758   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52759   __ret = (float64_t) __builtin_neon_vminvq_f64(__rev0);
  52760   return __ret;
  52761 }
  52762 #endif
  52763 
  52764 #ifdef __LITTLE_ENDIAN__
  52765 __ai __attribute__((target("neon"))) float32_t vminvq_f32(float32x4_t __p0) {
  52766   float32_t __ret;
  52767   __ret = (float32_t) __builtin_neon_vminvq_f32(__p0);
  52768   return __ret;
  52769 }
  52770 #else
  52771 __ai __attribute__((target("neon"))) float32_t vminvq_f32(float32x4_t __p0) {
  52772   float32_t __ret;
  52773   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52774   __ret = (float32_t) __builtin_neon_vminvq_f32(__rev0);
  52775   return __ret;
  52776 }
  52777 #endif
  52778 
  52779 #ifdef __LITTLE_ENDIAN__
  52780 __ai __attribute__((target("neon"))) int32_t vminvq_s32(int32x4_t __p0) {
  52781   int32_t __ret;
  52782   __ret = (int32_t) __builtin_neon_vminvq_s32(__p0);
  52783   return __ret;
  52784 }
  52785 #else
  52786 __ai __attribute__((target("neon"))) int32_t vminvq_s32(int32x4_t __p0) {
  52787   int32_t __ret;
  52788   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52789   __ret = (int32_t) __builtin_neon_vminvq_s32(__rev0);
  52790   return __ret;
  52791 }
  52792 #endif
  52793 
  52794 #ifdef __LITTLE_ENDIAN__
  52795 __ai __attribute__((target("neon"))) int16_t vminvq_s16(int16x8_t __p0) {
  52796   int16_t __ret;
  52797   __ret = (int16_t) __builtin_neon_vminvq_s16(__p0);
  52798   return __ret;
  52799 }
  52800 #else
  52801 __ai __attribute__((target("neon"))) int16_t vminvq_s16(int16x8_t __p0) {
  52802   int16_t __ret;
  52803   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52804   __ret = (int16_t) __builtin_neon_vminvq_s16(__rev0);
  52805   return __ret;
  52806 }
  52807 #endif
  52808 
  52809 #ifdef __LITTLE_ENDIAN__
  52810 __ai __attribute__((target("neon"))) uint8_t vminv_u8(uint8x8_t __p0) {
  52811   uint8_t __ret;
  52812   __ret = (uint8_t) __builtin_neon_vminv_u8(__p0);
  52813   return __ret;
  52814 }
  52815 #else
  52816 __ai __attribute__((target("neon"))) uint8_t vminv_u8(uint8x8_t __p0) {
  52817   uint8_t __ret;
  52818   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52819   __ret = (uint8_t) __builtin_neon_vminv_u8(__rev0);
  52820   return __ret;
  52821 }
  52822 #endif
  52823 
  52824 #ifdef __LITTLE_ENDIAN__
  52825 __ai __attribute__((target("neon"))) uint32_t vminv_u32(uint32x2_t __p0) {
  52826   uint32_t __ret;
  52827   __ret = (uint32_t) __builtin_neon_vminv_u32(__p0);
  52828   return __ret;
  52829 }
  52830 #else
  52831 __ai __attribute__((target("neon"))) uint32_t vminv_u32(uint32x2_t __p0) {
  52832   uint32_t __ret;
  52833   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52834   __ret = (uint32_t) __builtin_neon_vminv_u32(__rev0);
  52835   return __ret;
  52836 }
  52837 #endif
  52838 
  52839 #ifdef __LITTLE_ENDIAN__
  52840 __ai __attribute__((target("neon"))) uint16_t vminv_u16(uint16x4_t __p0) {
  52841   uint16_t __ret;
  52842   __ret = (uint16_t) __builtin_neon_vminv_u16(__p0);
  52843   return __ret;
  52844 }
  52845 #else
  52846 __ai __attribute__((target("neon"))) uint16_t vminv_u16(uint16x4_t __p0) {
  52847   uint16_t __ret;
  52848   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52849   __ret = (uint16_t) __builtin_neon_vminv_u16(__rev0);
  52850   return __ret;
  52851 }
  52852 #endif
  52853 
  52854 #ifdef __LITTLE_ENDIAN__
  52855 __ai __attribute__((target("neon"))) int8_t vminv_s8(int8x8_t __p0) {
  52856   int8_t __ret;
  52857   __ret = (int8_t) __builtin_neon_vminv_s8(__p0);
  52858   return __ret;
  52859 }
  52860 #else
  52861 __ai __attribute__((target("neon"))) int8_t vminv_s8(int8x8_t __p0) {
  52862   int8_t __ret;
  52863   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  52864   __ret = (int8_t) __builtin_neon_vminv_s8(__rev0);
  52865   return __ret;
  52866 }
  52867 #endif
  52868 
  52869 #ifdef __LITTLE_ENDIAN__
  52870 __ai __attribute__((target("neon"))) float32_t vminv_f32(float32x2_t __p0) {
  52871   float32_t __ret;
  52872   __ret = (float32_t) __builtin_neon_vminv_f32(__p0);
  52873   return __ret;
  52874 }
  52875 #else
  52876 __ai __attribute__((target("neon"))) float32_t vminv_f32(float32x2_t __p0) {
  52877   float32_t __ret;
  52878   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52879   __ret = (float32_t) __builtin_neon_vminv_f32(__rev0);
  52880   return __ret;
  52881 }
  52882 #endif
  52883 
  52884 #ifdef __LITTLE_ENDIAN__
  52885 __ai __attribute__((target("neon"))) int32_t vminv_s32(int32x2_t __p0) {
  52886   int32_t __ret;
  52887   __ret = (int32_t) __builtin_neon_vminv_s32(__p0);
  52888   return __ret;
  52889 }
  52890 #else
  52891 __ai __attribute__((target("neon"))) int32_t vminv_s32(int32x2_t __p0) {
  52892   int32_t __ret;
  52893   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52894   __ret = (int32_t) __builtin_neon_vminv_s32(__rev0);
  52895   return __ret;
  52896 }
  52897 #endif
  52898 
  52899 #ifdef __LITTLE_ENDIAN__
  52900 __ai __attribute__((target("neon"))) int16_t vminv_s16(int16x4_t __p0) {
  52901   int16_t __ret;
  52902   __ret = (int16_t) __builtin_neon_vminv_s16(__p0);
  52903   return __ret;
  52904 }
  52905 #else
  52906 __ai __attribute__((target("neon"))) int16_t vminv_s16(int16x4_t __p0) {
  52907   int16_t __ret;
  52908   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  52909   __ret = (int16_t) __builtin_neon_vminv_s16(__rev0);
  52910   return __ret;
  52911 }
  52912 #endif
  52913 
  52914 #ifdef __LITTLE_ENDIAN__
  52915 __ai __attribute__((target("neon"))) float64x2_t vmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  52916   float64x2_t __ret;
  52917   __ret = __p0 + __p1 * __p2;
  52918   return __ret;
  52919 }
  52920 #else
  52921 __ai __attribute__((target("neon"))) float64x2_t vmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  52922   float64x2_t __ret;
  52923   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  52924   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  52925   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  52926   __ret = __rev0 + __rev1 * __rev2;
  52927   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  52928   return __ret;
  52929 }
  52930 #endif
  52931 
  52932 __ai __attribute__((target("neon"))) float64x1_t vmla_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) {
  52933   float64x1_t __ret;
  52934   __ret = __p0 + __p1 * __p2;
  52935   return __ret;
  52936 }
  52937 #ifdef __LITTLE_ENDIAN__
  52938 #define vmlaq_laneq_u32(__p0_448, __p1_448, __p2_448, __p3_448) __extension__ ({ \
  52939   uint32x4_t __ret_448; \
  52940   uint32x4_t __s0_448 = __p0_448; \
  52941   uint32x4_t __s1_448 = __p1_448; \
  52942   uint32x4_t __s2_448 = __p2_448; \
  52943   __ret_448 = __s0_448 + __s1_448 * splatq_laneq_u32(__s2_448, __p3_448); \
  52944   __ret_448; \
  52945 })
  52946 #else
  52947 #define vmlaq_laneq_u32(__p0_449, __p1_449, __p2_449, __p3_449) __extension__ ({ \
  52948   uint32x4_t __ret_449; \
  52949   uint32x4_t __s0_449 = __p0_449; \
  52950   uint32x4_t __s1_449 = __p1_449; \
  52951   uint32x4_t __s2_449 = __p2_449; \
  52952   uint32x4_t __rev0_449;  __rev0_449 = __builtin_shufflevector(__s0_449, __s0_449, 3, 2, 1, 0); \
  52953   uint32x4_t __rev1_449;  __rev1_449 = __builtin_shufflevector(__s1_449, __s1_449, 3, 2, 1, 0); \
  52954   uint32x4_t __rev2_449;  __rev2_449 = __builtin_shufflevector(__s2_449, __s2_449, 3, 2, 1, 0); \
  52955   __ret_449 = __rev0_449 + __rev1_449 * __noswap_splatq_laneq_u32(__rev2_449, __p3_449); \
  52956   __ret_449 = __builtin_shufflevector(__ret_449, __ret_449, 3, 2, 1, 0); \
  52957   __ret_449; \
  52958 })
  52959 #endif
  52960 
  52961 #ifdef __LITTLE_ENDIAN__
  52962 #define vmlaq_laneq_u16(__p0_450, __p1_450, __p2_450, __p3_450) __extension__ ({ \
  52963   uint16x8_t __ret_450; \
  52964   uint16x8_t __s0_450 = __p0_450; \
  52965   uint16x8_t __s1_450 = __p1_450; \
  52966   uint16x8_t __s2_450 = __p2_450; \
  52967   __ret_450 = __s0_450 + __s1_450 * splatq_laneq_u16(__s2_450, __p3_450); \
  52968   __ret_450; \
  52969 })
  52970 #else
  52971 #define vmlaq_laneq_u16(__p0_451, __p1_451, __p2_451, __p3_451) __extension__ ({ \
  52972   uint16x8_t __ret_451; \
  52973   uint16x8_t __s0_451 = __p0_451; \
  52974   uint16x8_t __s1_451 = __p1_451; \
  52975   uint16x8_t __s2_451 = __p2_451; \
  52976   uint16x8_t __rev0_451;  __rev0_451 = __builtin_shufflevector(__s0_451, __s0_451, 7, 6, 5, 4, 3, 2, 1, 0); \
  52977   uint16x8_t __rev1_451;  __rev1_451 = __builtin_shufflevector(__s1_451, __s1_451, 7, 6, 5, 4, 3, 2, 1, 0); \
  52978   uint16x8_t __rev2_451;  __rev2_451 = __builtin_shufflevector(__s2_451, __s2_451, 7, 6, 5, 4, 3, 2, 1, 0); \
  52979   __ret_451 = __rev0_451 + __rev1_451 * __noswap_splatq_laneq_u16(__rev2_451, __p3_451); \
  52980   __ret_451 = __builtin_shufflevector(__ret_451, __ret_451, 7, 6, 5, 4, 3, 2, 1, 0); \
  52981   __ret_451; \
  52982 })
  52983 #endif
  52984 
  52985 #ifdef __LITTLE_ENDIAN__
  52986 #define vmlaq_laneq_f32(__p0_452, __p1_452, __p2_452, __p3_452) __extension__ ({ \
  52987   float32x4_t __ret_452; \
  52988   float32x4_t __s0_452 = __p0_452; \
  52989   float32x4_t __s1_452 = __p1_452; \
  52990   float32x4_t __s2_452 = __p2_452; \
  52991   __ret_452 = __s0_452 + __s1_452 * splatq_laneq_f32(__s2_452, __p3_452); \
  52992   __ret_452; \
  52993 })
  52994 #else
  52995 #define vmlaq_laneq_f32(__p0_453, __p1_453, __p2_453, __p3_453) __extension__ ({ \
  52996   float32x4_t __ret_453; \
  52997   float32x4_t __s0_453 = __p0_453; \
  52998   float32x4_t __s1_453 = __p1_453; \
  52999   float32x4_t __s2_453 = __p2_453; \
  53000   float32x4_t __rev0_453;  __rev0_453 = __builtin_shufflevector(__s0_453, __s0_453, 3, 2, 1, 0); \
  53001   float32x4_t __rev1_453;  __rev1_453 = __builtin_shufflevector(__s1_453, __s1_453, 3, 2, 1, 0); \
  53002   float32x4_t __rev2_453;  __rev2_453 = __builtin_shufflevector(__s2_453, __s2_453, 3, 2, 1, 0); \
  53003   __ret_453 = __rev0_453 + __rev1_453 * __noswap_splatq_laneq_f32(__rev2_453, __p3_453); \
  53004   __ret_453 = __builtin_shufflevector(__ret_453, __ret_453, 3, 2, 1, 0); \
  53005   __ret_453; \
  53006 })
  53007 #endif
  53008 
  53009 #ifdef __LITTLE_ENDIAN__
  53010 #define vmlaq_laneq_s32(__p0_454, __p1_454, __p2_454, __p3_454) __extension__ ({ \
  53011   int32x4_t __ret_454; \
  53012   int32x4_t __s0_454 = __p0_454; \
  53013   int32x4_t __s1_454 = __p1_454; \
  53014   int32x4_t __s2_454 = __p2_454; \
  53015   __ret_454 = __s0_454 + __s1_454 * splatq_laneq_s32(__s2_454, __p3_454); \
  53016   __ret_454; \
  53017 })
  53018 #else
  53019 #define vmlaq_laneq_s32(__p0_455, __p1_455, __p2_455, __p3_455) __extension__ ({ \
  53020   int32x4_t __ret_455; \
  53021   int32x4_t __s0_455 = __p0_455; \
  53022   int32x4_t __s1_455 = __p1_455; \
  53023   int32x4_t __s2_455 = __p2_455; \
  53024   int32x4_t __rev0_455;  __rev0_455 = __builtin_shufflevector(__s0_455, __s0_455, 3, 2, 1, 0); \
  53025   int32x4_t __rev1_455;  __rev1_455 = __builtin_shufflevector(__s1_455, __s1_455, 3, 2, 1, 0); \
  53026   int32x4_t __rev2_455;  __rev2_455 = __builtin_shufflevector(__s2_455, __s2_455, 3, 2, 1, 0); \
  53027   __ret_455 = __rev0_455 + __rev1_455 * __noswap_splatq_laneq_s32(__rev2_455, __p3_455); \
  53028   __ret_455 = __builtin_shufflevector(__ret_455, __ret_455, 3, 2, 1, 0); \
  53029   __ret_455; \
  53030 })
  53031 #endif
  53032 
  53033 #ifdef __LITTLE_ENDIAN__
  53034 #define vmlaq_laneq_s16(__p0_456, __p1_456, __p2_456, __p3_456) __extension__ ({ \
  53035   int16x8_t __ret_456; \
  53036   int16x8_t __s0_456 = __p0_456; \
  53037   int16x8_t __s1_456 = __p1_456; \
  53038   int16x8_t __s2_456 = __p2_456; \
  53039   __ret_456 = __s0_456 + __s1_456 * splatq_laneq_s16(__s2_456, __p3_456); \
  53040   __ret_456; \
  53041 })
  53042 #else
  53043 #define vmlaq_laneq_s16(__p0_457, __p1_457, __p2_457, __p3_457) __extension__ ({ \
  53044   int16x8_t __ret_457; \
  53045   int16x8_t __s0_457 = __p0_457; \
  53046   int16x8_t __s1_457 = __p1_457; \
  53047   int16x8_t __s2_457 = __p2_457; \
  53048   int16x8_t __rev0_457;  __rev0_457 = __builtin_shufflevector(__s0_457, __s0_457, 7, 6, 5, 4, 3, 2, 1, 0); \
  53049   int16x8_t __rev1_457;  __rev1_457 = __builtin_shufflevector(__s1_457, __s1_457, 7, 6, 5, 4, 3, 2, 1, 0); \
  53050   int16x8_t __rev2_457;  __rev2_457 = __builtin_shufflevector(__s2_457, __s2_457, 7, 6, 5, 4, 3, 2, 1, 0); \
  53051   __ret_457 = __rev0_457 + __rev1_457 * __noswap_splatq_laneq_s16(__rev2_457, __p3_457); \
  53052   __ret_457 = __builtin_shufflevector(__ret_457, __ret_457, 7, 6, 5, 4, 3, 2, 1, 0); \
  53053   __ret_457; \
  53054 })
  53055 #endif
  53056 
  53057 #ifdef __LITTLE_ENDIAN__
  53058 #define vmla_laneq_u32(__p0_458, __p1_458, __p2_458, __p3_458) __extension__ ({ \
  53059   uint32x2_t __ret_458; \
  53060   uint32x2_t __s0_458 = __p0_458; \
  53061   uint32x2_t __s1_458 = __p1_458; \
  53062   uint32x4_t __s2_458 = __p2_458; \
  53063   __ret_458 = __s0_458 + __s1_458 * splat_laneq_u32(__s2_458, __p3_458); \
  53064   __ret_458; \
  53065 })
  53066 #else
  53067 #define vmla_laneq_u32(__p0_459, __p1_459, __p2_459, __p3_459) __extension__ ({ \
  53068   uint32x2_t __ret_459; \
  53069   uint32x2_t __s0_459 = __p0_459; \
  53070   uint32x2_t __s1_459 = __p1_459; \
  53071   uint32x4_t __s2_459 = __p2_459; \
  53072   uint32x2_t __rev0_459;  __rev0_459 = __builtin_shufflevector(__s0_459, __s0_459, 1, 0); \
  53073   uint32x2_t __rev1_459;  __rev1_459 = __builtin_shufflevector(__s1_459, __s1_459, 1, 0); \
  53074   uint32x4_t __rev2_459;  __rev2_459 = __builtin_shufflevector(__s2_459, __s2_459, 3, 2, 1, 0); \
  53075   __ret_459 = __rev0_459 + __rev1_459 * __noswap_splat_laneq_u32(__rev2_459, __p3_459); \
  53076   __ret_459 = __builtin_shufflevector(__ret_459, __ret_459, 1, 0); \
  53077   __ret_459; \
  53078 })
  53079 #endif
  53080 
  53081 #ifdef __LITTLE_ENDIAN__
  53082 #define vmla_laneq_u16(__p0_460, __p1_460, __p2_460, __p3_460) __extension__ ({ \
  53083   uint16x4_t __ret_460; \
  53084   uint16x4_t __s0_460 = __p0_460; \
  53085   uint16x4_t __s1_460 = __p1_460; \
  53086   uint16x8_t __s2_460 = __p2_460; \
  53087   __ret_460 = __s0_460 + __s1_460 * splat_laneq_u16(__s2_460, __p3_460); \
  53088   __ret_460; \
  53089 })
  53090 #else
  53091 #define vmla_laneq_u16(__p0_461, __p1_461, __p2_461, __p3_461) __extension__ ({ \
  53092   uint16x4_t __ret_461; \
  53093   uint16x4_t __s0_461 = __p0_461; \
  53094   uint16x4_t __s1_461 = __p1_461; \
  53095   uint16x8_t __s2_461 = __p2_461; \
  53096   uint16x4_t __rev0_461;  __rev0_461 = __builtin_shufflevector(__s0_461, __s0_461, 3, 2, 1, 0); \
  53097   uint16x4_t __rev1_461;  __rev1_461 = __builtin_shufflevector(__s1_461, __s1_461, 3, 2, 1, 0); \
  53098   uint16x8_t __rev2_461;  __rev2_461 = __builtin_shufflevector(__s2_461, __s2_461, 7, 6, 5, 4, 3, 2, 1, 0); \
  53099   __ret_461 = __rev0_461 + __rev1_461 * __noswap_splat_laneq_u16(__rev2_461, __p3_461); \
  53100   __ret_461 = __builtin_shufflevector(__ret_461, __ret_461, 3, 2, 1, 0); \
  53101   __ret_461; \
  53102 })
  53103 #endif
  53104 
  53105 #ifdef __LITTLE_ENDIAN__
  53106 #define vmla_laneq_f32(__p0_462, __p1_462, __p2_462, __p3_462) __extension__ ({ \
  53107   float32x2_t __ret_462; \
  53108   float32x2_t __s0_462 = __p0_462; \
  53109   float32x2_t __s1_462 = __p1_462; \
  53110   float32x4_t __s2_462 = __p2_462; \
  53111   __ret_462 = __s0_462 + __s1_462 * splat_laneq_f32(__s2_462, __p3_462); \
  53112   __ret_462; \
  53113 })
  53114 #else
  53115 #define vmla_laneq_f32(__p0_463, __p1_463, __p2_463, __p3_463) __extension__ ({ \
  53116   float32x2_t __ret_463; \
  53117   float32x2_t __s0_463 = __p0_463; \
  53118   float32x2_t __s1_463 = __p1_463; \
  53119   float32x4_t __s2_463 = __p2_463; \
  53120   float32x2_t __rev0_463;  __rev0_463 = __builtin_shufflevector(__s0_463, __s0_463, 1, 0); \
  53121   float32x2_t __rev1_463;  __rev1_463 = __builtin_shufflevector(__s1_463, __s1_463, 1, 0); \
  53122   float32x4_t __rev2_463;  __rev2_463 = __builtin_shufflevector(__s2_463, __s2_463, 3, 2, 1, 0); \
  53123   __ret_463 = __rev0_463 + __rev1_463 * __noswap_splat_laneq_f32(__rev2_463, __p3_463); \
  53124   __ret_463 = __builtin_shufflevector(__ret_463, __ret_463, 1, 0); \
  53125   __ret_463; \
  53126 })
  53127 #endif
  53128 
  53129 #ifdef __LITTLE_ENDIAN__
  53130 #define vmla_laneq_s32(__p0_464, __p1_464, __p2_464, __p3_464) __extension__ ({ \
  53131   int32x2_t __ret_464; \
  53132   int32x2_t __s0_464 = __p0_464; \
  53133   int32x2_t __s1_464 = __p1_464; \
  53134   int32x4_t __s2_464 = __p2_464; \
  53135   __ret_464 = __s0_464 + __s1_464 * splat_laneq_s32(__s2_464, __p3_464); \
  53136   __ret_464; \
  53137 })
  53138 #else
  53139 #define vmla_laneq_s32(__p0_465, __p1_465, __p2_465, __p3_465) __extension__ ({ \
  53140   int32x2_t __ret_465; \
  53141   int32x2_t __s0_465 = __p0_465; \
  53142   int32x2_t __s1_465 = __p1_465; \
  53143   int32x4_t __s2_465 = __p2_465; \
  53144   int32x2_t __rev0_465;  __rev0_465 = __builtin_shufflevector(__s0_465, __s0_465, 1, 0); \
  53145   int32x2_t __rev1_465;  __rev1_465 = __builtin_shufflevector(__s1_465, __s1_465, 1, 0); \
  53146   int32x4_t __rev2_465;  __rev2_465 = __builtin_shufflevector(__s2_465, __s2_465, 3, 2, 1, 0); \
  53147   __ret_465 = __rev0_465 + __rev1_465 * __noswap_splat_laneq_s32(__rev2_465, __p3_465); \
  53148   __ret_465 = __builtin_shufflevector(__ret_465, __ret_465, 1, 0); \
  53149   __ret_465; \
  53150 })
  53151 #endif
  53152 
  53153 #ifdef __LITTLE_ENDIAN__
  53154 #define vmla_laneq_s16(__p0_466, __p1_466, __p2_466, __p3_466) __extension__ ({ \
  53155   int16x4_t __ret_466; \
  53156   int16x4_t __s0_466 = __p0_466; \
  53157   int16x4_t __s1_466 = __p1_466; \
  53158   int16x8_t __s2_466 = __p2_466; \
  53159   __ret_466 = __s0_466 + __s1_466 * splat_laneq_s16(__s2_466, __p3_466); \
  53160   __ret_466; \
  53161 })
  53162 #else
  53163 #define vmla_laneq_s16(__p0_467, __p1_467, __p2_467, __p3_467) __extension__ ({ \
  53164   int16x4_t __ret_467; \
  53165   int16x4_t __s0_467 = __p0_467; \
  53166   int16x4_t __s1_467 = __p1_467; \
  53167   int16x8_t __s2_467 = __p2_467; \
  53168   int16x4_t __rev0_467;  __rev0_467 = __builtin_shufflevector(__s0_467, __s0_467, 3, 2, 1, 0); \
  53169   int16x4_t __rev1_467;  __rev1_467 = __builtin_shufflevector(__s1_467, __s1_467, 3, 2, 1, 0); \
  53170   int16x8_t __rev2_467;  __rev2_467 = __builtin_shufflevector(__s2_467, __s2_467, 7, 6, 5, 4, 3, 2, 1, 0); \
  53171   __ret_467 = __rev0_467 + __rev1_467 * __noswap_splat_laneq_s16(__rev2_467, __p3_467); \
  53172   __ret_467 = __builtin_shufflevector(__ret_467, __ret_467, 3, 2, 1, 0); \
  53173   __ret_467; \
  53174 })
  53175 #endif
  53176 
  53177 #ifdef __LITTLE_ENDIAN__
  53178 #define vmlal_high_lane_u32(__p0_468, __p1_468, __p2_468, __p3_468) __extension__ ({ \
  53179   uint64x2_t __ret_468; \
  53180   uint64x2_t __s0_468 = __p0_468; \
  53181   uint32x4_t __s1_468 = __p1_468; \
  53182   uint32x2_t __s2_468 = __p2_468; \
  53183   __ret_468 = __s0_468 + vmull_u32(vget_high_u32(__s1_468), splat_lane_u32(__s2_468, __p3_468)); \
  53184   __ret_468; \
  53185 })
  53186 #else
  53187 #define vmlal_high_lane_u32(__p0_469, __p1_469, __p2_469, __p3_469) __extension__ ({ \
  53188   uint64x2_t __ret_469; \
  53189   uint64x2_t __s0_469 = __p0_469; \
  53190   uint32x4_t __s1_469 = __p1_469; \
  53191   uint32x2_t __s2_469 = __p2_469; \
  53192   uint64x2_t __rev0_469;  __rev0_469 = __builtin_shufflevector(__s0_469, __s0_469, 1, 0); \
  53193   uint32x4_t __rev1_469;  __rev1_469 = __builtin_shufflevector(__s1_469, __s1_469, 3, 2, 1, 0); \
  53194   uint32x2_t __rev2_469;  __rev2_469 = __builtin_shufflevector(__s2_469, __s2_469, 1, 0); \
  53195   __ret_469 = __rev0_469 + __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_469), __noswap_splat_lane_u32(__rev2_469, __p3_469)); \
  53196   __ret_469 = __builtin_shufflevector(__ret_469, __ret_469, 1, 0); \
  53197   __ret_469; \
  53198 })
  53199 #endif
  53200 
  53201 #ifdef __LITTLE_ENDIAN__
  53202 #define vmlal_high_lane_u16(__p0_470, __p1_470, __p2_470, __p3_470) __extension__ ({ \
  53203   uint32x4_t __ret_470; \
  53204   uint32x4_t __s0_470 = __p0_470; \
  53205   uint16x8_t __s1_470 = __p1_470; \
  53206   uint16x4_t __s2_470 = __p2_470; \
  53207   __ret_470 = __s0_470 + vmull_u16(vget_high_u16(__s1_470), splat_lane_u16(__s2_470, __p3_470)); \
  53208   __ret_470; \
  53209 })
  53210 #else
  53211 #define vmlal_high_lane_u16(__p0_471, __p1_471, __p2_471, __p3_471) __extension__ ({ \
  53212   uint32x4_t __ret_471; \
  53213   uint32x4_t __s0_471 = __p0_471; \
  53214   uint16x8_t __s1_471 = __p1_471; \
  53215   uint16x4_t __s2_471 = __p2_471; \
  53216   uint32x4_t __rev0_471;  __rev0_471 = __builtin_shufflevector(__s0_471, __s0_471, 3, 2, 1, 0); \
  53217   uint16x8_t __rev1_471;  __rev1_471 = __builtin_shufflevector(__s1_471, __s1_471, 7, 6, 5, 4, 3, 2, 1, 0); \
  53218   uint16x4_t __rev2_471;  __rev2_471 = __builtin_shufflevector(__s2_471, __s2_471, 3, 2, 1, 0); \
  53219   __ret_471 = __rev0_471 + __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_471), __noswap_splat_lane_u16(__rev2_471, __p3_471)); \
  53220   __ret_471 = __builtin_shufflevector(__ret_471, __ret_471, 3, 2, 1, 0); \
  53221   __ret_471; \
  53222 })
  53223 #endif
  53224 
  53225 #ifdef __LITTLE_ENDIAN__
  53226 #define vmlal_high_lane_s32(__p0_472, __p1_472, __p2_472, __p3_472) __extension__ ({ \
  53227   int64x2_t __ret_472; \
  53228   int64x2_t __s0_472 = __p0_472; \
  53229   int32x4_t __s1_472 = __p1_472; \
  53230   int32x2_t __s2_472 = __p2_472; \
  53231   __ret_472 = __s0_472 + vmull_s32(vget_high_s32(__s1_472), splat_lane_s32(__s2_472, __p3_472)); \
  53232   __ret_472; \
  53233 })
  53234 #else
  53235 #define vmlal_high_lane_s32(__p0_473, __p1_473, __p2_473, __p3_473) __extension__ ({ \
  53236   int64x2_t __ret_473; \
  53237   int64x2_t __s0_473 = __p0_473; \
  53238   int32x4_t __s1_473 = __p1_473; \
  53239   int32x2_t __s2_473 = __p2_473; \
  53240   int64x2_t __rev0_473;  __rev0_473 = __builtin_shufflevector(__s0_473, __s0_473, 1, 0); \
  53241   int32x4_t __rev1_473;  __rev1_473 = __builtin_shufflevector(__s1_473, __s1_473, 3, 2, 1, 0); \
  53242   int32x2_t __rev2_473;  __rev2_473 = __builtin_shufflevector(__s2_473, __s2_473, 1, 0); \
  53243   __ret_473 = __rev0_473 + __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_473), __noswap_splat_lane_s32(__rev2_473, __p3_473)); \
  53244   __ret_473 = __builtin_shufflevector(__ret_473, __ret_473, 1, 0); \
  53245   __ret_473; \
  53246 })
  53247 #endif
  53248 
  53249 #ifdef __LITTLE_ENDIAN__
  53250 #define vmlal_high_lane_s16(__p0_474, __p1_474, __p2_474, __p3_474) __extension__ ({ \
  53251   int32x4_t __ret_474; \
  53252   int32x4_t __s0_474 = __p0_474; \
  53253   int16x8_t __s1_474 = __p1_474; \
  53254   int16x4_t __s2_474 = __p2_474; \
  53255   __ret_474 = __s0_474 + vmull_s16(vget_high_s16(__s1_474), splat_lane_s16(__s2_474, __p3_474)); \
  53256   __ret_474; \
  53257 })
  53258 #else
  53259 #define vmlal_high_lane_s16(__p0_475, __p1_475, __p2_475, __p3_475) __extension__ ({ \
  53260   int32x4_t __ret_475; \
  53261   int32x4_t __s0_475 = __p0_475; \
  53262   int16x8_t __s1_475 = __p1_475; \
  53263   int16x4_t __s2_475 = __p2_475; \
  53264   int32x4_t __rev0_475;  __rev0_475 = __builtin_shufflevector(__s0_475, __s0_475, 3, 2, 1, 0); \
  53265   int16x8_t __rev1_475;  __rev1_475 = __builtin_shufflevector(__s1_475, __s1_475, 7, 6, 5, 4, 3, 2, 1, 0); \
  53266   int16x4_t __rev2_475;  __rev2_475 = __builtin_shufflevector(__s2_475, __s2_475, 3, 2, 1, 0); \
  53267   __ret_475 = __rev0_475 + __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_475), __noswap_splat_lane_s16(__rev2_475, __p3_475)); \
  53268   __ret_475 = __builtin_shufflevector(__ret_475, __ret_475, 3, 2, 1, 0); \
  53269   __ret_475; \
  53270 })
  53271 #endif
  53272 
  53273 #ifdef __LITTLE_ENDIAN__
  53274 #define vmlal_high_laneq_u32(__p0_476, __p1_476, __p2_476, __p3_476) __extension__ ({ \
  53275   uint64x2_t __ret_476; \
  53276   uint64x2_t __s0_476 = __p0_476; \
  53277   uint32x4_t __s1_476 = __p1_476; \
  53278   uint32x4_t __s2_476 = __p2_476; \
  53279   __ret_476 = __s0_476 + vmull_u32(vget_high_u32(__s1_476), splat_laneq_u32(__s2_476, __p3_476)); \
  53280   __ret_476; \
  53281 })
  53282 #else
  53283 #define vmlal_high_laneq_u32(__p0_477, __p1_477, __p2_477, __p3_477) __extension__ ({ \
  53284   uint64x2_t __ret_477; \
  53285   uint64x2_t __s0_477 = __p0_477; \
  53286   uint32x4_t __s1_477 = __p1_477; \
  53287   uint32x4_t __s2_477 = __p2_477; \
  53288   uint64x2_t __rev0_477;  __rev0_477 = __builtin_shufflevector(__s0_477, __s0_477, 1, 0); \
  53289   uint32x4_t __rev1_477;  __rev1_477 = __builtin_shufflevector(__s1_477, __s1_477, 3, 2, 1, 0); \
  53290   uint32x4_t __rev2_477;  __rev2_477 = __builtin_shufflevector(__s2_477, __s2_477, 3, 2, 1, 0); \
  53291   __ret_477 = __rev0_477 + __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_477), __noswap_splat_laneq_u32(__rev2_477, __p3_477)); \
  53292   __ret_477 = __builtin_shufflevector(__ret_477, __ret_477, 1, 0); \
  53293   __ret_477; \
  53294 })
  53295 #endif
  53296 
  53297 #ifdef __LITTLE_ENDIAN__
  53298 #define vmlal_high_laneq_u16(__p0_478, __p1_478, __p2_478, __p3_478) __extension__ ({ \
  53299   uint32x4_t __ret_478; \
  53300   uint32x4_t __s0_478 = __p0_478; \
  53301   uint16x8_t __s1_478 = __p1_478; \
  53302   uint16x8_t __s2_478 = __p2_478; \
  53303   __ret_478 = __s0_478 + vmull_u16(vget_high_u16(__s1_478), splat_laneq_u16(__s2_478, __p3_478)); \
  53304   __ret_478; \
  53305 })
  53306 #else
  53307 #define vmlal_high_laneq_u16(__p0_479, __p1_479, __p2_479, __p3_479) __extension__ ({ \
  53308   uint32x4_t __ret_479; \
  53309   uint32x4_t __s0_479 = __p0_479; \
  53310   uint16x8_t __s1_479 = __p1_479; \
  53311   uint16x8_t __s2_479 = __p2_479; \
  53312   uint32x4_t __rev0_479;  __rev0_479 = __builtin_shufflevector(__s0_479, __s0_479, 3, 2, 1, 0); \
  53313   uint16x8_t __rev1_479;  __rev1_479 = __builtin_shufflevector(__s1_479, __s1_479, 7, 6, 5, 4, 3, 2, 1, 0); \
  53314   uint16x8_t __rev2_479;  __rev2_479 = __builtin_shufflevector(__s2_479, __s2_479, 7, 6, 5, 4, 3, 2, 1, 0); \
  53315   __ret_479 = __rev0_479 + __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_479), __noswap_splat_laneq_u16(__rev2_479, __p3_479)); \
  53316   __ret_479 = __builtin_shufflevector(__ret_479, __ret_479, 3, 2, 1, 0); \
  53317   __ret_479; \
  53318 })
  53319 #endif
  53320 
  53321 #ifdef __LITTLE_ENDIAN__
  53322 #define vmlal_high_laneq_s32(__p0_480, __p1_480, __p2_480, __p3_480) __extension__ ({ \
  53323   int64x2_t __ret_480; \
  53324   int64x2_t __s0_480 = __p0_480; \
  53325   int32x4_t __s1_480 = __p1_480; \
  53326   int32x4_t __s2_480 = __p2_480; \
  53327   __ret_480 = __s0_480 + vmull_s32(vget_high_s32(__s1_480), splat_laneq_s32(__s2_480, __p3_480)); \
  53328   __ret_480; \
  53329 })
  53330 #else
  53331 #define vmlal_high_laneq_s32(__p0_481, __p1_481, __p2_481, __p3_481) __extension__ ({ \
  53332   int64x2_t __ret_481; \
  53333   int64x2_t __s0_481 = __p0_481; \
  53334   int32x4_t __s1_481 = __p1_481; \
  53335   int32x4_t __s2_481 = __p2_481; \
  53336   int64x2_t __rev0_481;  __rev0_481 = __builtin_shufflevector(__s0_481, __s0_481, 1, 0); \
  53337   int32x4_t __rev1_481;  __rev1_481 = __builtin_shufflevector(__s1_481, __s1_481, 3, 2, 1, 0); \
  53338   int32x4_t __rev2_481;  __rev2_481 = __builtin_shufflevector(__s2_481, __s2_481, 3, 2, 1, 0); \
  53339   __ret_481 = __rev0_481 + __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_481), __noswap_splat_laneq_s32(__rev2_481, __p3_481)); \
  53340   __ret_481 = __builtin_shufflevector(__ret_481, __ret_481, 1, 0); \
  53341   __ret_481; \
  53342 })
  53343 #endif
  53344 
  53345 #ifdef __LITTLE_ENDIAN__
  53346 #define vmlal_high_laneq_s16(__p0_482, __p1_482, __p2_482, __p3_482) __extension__ ({ \
  53347   int32x4_t __ret_482; \
  53348   int32x4_t __s0_482 = __p0_482; \
  53349   int16x8_t __s1_482 = __p1_482; \
  53350   int16x8_t __s2_482 = __p2_482; \
  53351   __ret_482 = __s0_482 + vmull_s16(vget_high_s16(__s1_482), splat_laneq_s16(__s2_482, __p3_482)); \
  53352   __ret_482; \
  53353 })
  53354 #else
  53355 #define vmlal_high_laneq_s16(__p0_483, __p1_483, __p2_483, __p3_483) __extension__ ({ \
  53356   int32x4_t __ret_483; \
  53357   int32x4_t __s0_483 = __p0_483; \
  53358   int16x8_t __s1_483 = __p1_483; \
  53359   int16x8_t __s2_483 = __p2_483; \
  53360   int32x4_t __rev0_483;  __rev0_483 = __builtin_shufflevector(__s0_483, __s0_483, 3, 2, 1, 0); \
  53361   int16x8_t __rev1_483;  __rev1_483 = __builtin_shufflevector(__s1_483, __s1_483, 7, 6, 5, 4, 3, 2, 1, 0); \
  53362   int16x8_t __rev2_483;  __rev2_483 = __builtin_shufflevector(__s2_483, __s2_483, 7, 6, 5, 4, 3, 2, 1, 0); \
  53363   __ret_483 = __rev0_483 + __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_483), __noswap_splat_laneq_s16(__rev2_483, __p3_483)); \
  53364   __ret_483 = __builtin_shufflevector(__ret_483, __ret_483, 3, 2, 1, 0); \
  53365   __ret_483; \
  53366 })
  53367 #endif
  53368 
  53369 #ifdef __LITTLE_ENDIAN__
  53370 #define vmlal_laneq_u32(__p0_484, __p1_484, __p2_484, __p3_484) __extension__ ({ \
  53371   uint64x2_t __ret_484; \
  53372   uint64x2_t __s0_484 = __p0_484; \
  53373   uint32x2_t __s1_484 = __p1_484; \
  53374   uint32x4_t __s2_484 = __p2_484; \
  53375   __ret_484 = __s0_484 + vmull_u32(__s1_484, splat_laneq_u32(__s2_484, __p3_484)); \
  53376   __ret_484; \
  53377 })
  53378 #else
  53379 #define vmlal_laneq_u32(__p0_485, __p1_485, __p2_485, __p3_485) __extension__ ({ \
  53380   uint64x2_t __ret_485; \
  53381   uint64x2_t __s0_485 = __p0_485; \
  53382   uint32x2_t __s1_485 = __p1_485; \
  53383   uint32x4_t __s2_485 = __p2_485; \
  53384   uint64x2_t __rev0_485;  __rev0_485 = __builtin_shufflevector(__s0_485, __s0_485, 1, 0); \
  53385   uint32x2_t __rev1_485;  __rev1_485 = __builtin_shufflevector(__s1_485, __s1_485, 1, 0); \
  53386   uint32x4_t __rev2_485;  __rev2_485 = __builtin_shufflevector(__s2_485, __s2_485, 3, 2, 1, 0); \
  53387   __ret_485 = __rev0_485 + __noswap_vmull_u32(__rev1_485, __noswap_splat_laneq_u32(__rev2_485, __p3_485)); \
  53388   __ret_485 = __builtin_shufflevector(__ret_485, __ret_485, 1, 0); \
  53389   __ret_485; \
  53390 })
  53391 #endif
  53392 
  53393 #ifdef __LITTLE_ENDIAN__
        /* vmlal_laneq_u16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (uint32x4_t, uint16x4_t,
         * uint16x8_t) and yields
         *   __p0 + vmull_u16(__p1, splat_laneq_u16(__p2, __p3))
         * as a uint32x4_t.  vmull_u16 and splat_laneq_u16 are defined elsewhere. */
  53394 #define vmlal_laneq_u16(__p0_486, __p1_486, __p2_486, __p3_486) __extension__ ({ \
  53395   uint32x4_t __ret_486; \
  53396   uint32x4_t __s0_486 = __p0_486; \
  53397   uint16x4_t __s1_486 = __p1_486; \
  53398   uint16x8_t __s2_486 = __p2_486; \
  53399   __ret_486 = __s0_486 + vmull_u16(__s1_486, splat_laneq_u16(__s2_486, __p3_486)); \
  53400   __ret_486; \
  53401 })
  53402 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the sum is lane-reversed back before being yielded. */
  53403 #define vmlal_laneq_u16(__p0_487, __p1_487, __p2_487, __p3_487) __extension__ ({ \
  53404   uint32x4_t __ret_487; \
  53405   uint32x4_t __s0_487 = __p0_487; \
  53406   uint16x4_t __s1_487 = __p1_487; \
  53407   uint16x8_t __s2_487 = __p2_487; \
  53408   uint32x4_t __rev0_487;  __rev0_487 = __builtin_shufflevector(__s0_487, __s0_487, 3, 2, 1, 0); \
  53409   uint16x4_t __rev1_487;  __rev1_487 = __builtin_shufflevector(__s1_487, __s1_487, 3, 2, 1, 0); \
  53410   uint16x8_t __rev2_487;  __rev2_487 = __builtin_shufflevector(__s2_487, __s2_487, 7, 6, 5, 4, 3, 2, 1, 0); \
  53411   __ret_487 = __rev0_487 + __noswap_vmull_u16(__rev1_487, __noswap_splat_laneq_u16(__rev2_487, __p3_487)); \
  53412   __ret_487 = __builtin_shufflevector(__ret_487, __ret_487, 3, 2, 1, 0); \
  53413   __ret_487; \
  53414 })
  53415 #endif
  53416 
  53417 #ifdef __LITTLE_ENDIAN__
        /* vmlal_laneq_s32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int64x2_t, int32x2_t,
         * int32x4_t) and yields
         *   __p0 + vmull_s32(__p1, splat_laneq_s32(__p2, __p3))
         * as an int64x2_t.  vmull_s32 and splat_laneq_s32 are defined elsewhere. */
  53418 #define vmlal_laneq_s32(__p0_488, __p1_488, __p2_488, __p3_488) __extension__ ({ \
  53419   int64x2_t __ret_488; \
  53420   int64x2_t __s0_488 = __p0_488; \
  53421   int32x2_t __s1_488 = __p1_488; \
  53422   int32x4_t __s2_488 = __p2_488; \
  53423   __ret_488 = __s0_488 + vmull_s32(__s1_488, splat_laneq_s32(__s2_488, __p3_488)); \
  53424   __ret_488; \
  53425 })
  53426 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the sum is lane-reversed back before being yielded. */
  53427 #define vmlal_laneq_s32(__p0_489, __p1_489, __p2_489, __p3_489) __extension__ ({ \
  53428   int64x2_t __ret_489; \
  53429   int64x2_t __s0_489 = __p0_489; \
  53430   int32x2_t __s1_489 = __p1_489; \
  53431   int32x4_t __s2_489 = __p2_489; \
  53432   int64x2_t __rev0_489;  __rev0_489 = __builtin_shufflevector(__s0_489, __s0_489, 1, 0); \
  53433   int32x2_t __rev1_489;  __rev1_489 = __builtin_shufflevector(__s1_489, __s1_489, 1, 0); \
  53434   int32x4_t __rev2_489;  __rev2_489 = __builtin_shufflevector(__s2_489, __s2_489, 3, 2, 1, 0); \
  53435   __ret_489 = __rev0_489 + __noswap_vmull_s32(__rev1_489, __noswap_splat_laneq_s32(__rev2_489, __p3_489)); \
  53436   __ret_489 = __builtin_shufflevector(__ret_489, __ret_489, 1, 0); \
  53437   __ret_489; \
  53438 })
  53439 #endif
  53440 
  53441 #ifdef __LITTLE_ENDIAN__
        /* vmlal_laneq_s16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int32x4_t, int16x4_t,
         * int16x8_t) and yields
         *   __p0 + vmull_s16(__p1, splat_laneq_s16(__p2, __p3))
         * as an int32x4_t.  vmull_s16 and splat_laneq_s16 are defined elsewhere. */
  53442 #define vmlal_laneq_s16(__p0_490, __p1_490, __p2_490, __p3_490) __extension__ ({ \
  53443   int32x4_t __ret_490; \
  53444   int32x4_t __s0_490 = __p0_490; \
  53445   int16x4_t __s1_490 = __p1_490; \
  53446   int16x8_t __s2_490 = __p2_490; \
  53447   __ret_490 = __s0_490 + vmull_s16(__s1_490, splat_laneq_s16(__s2_490, __p3_490)); \
  53448   __ret_490; \
  53449 })
  53450 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the sum is lane-reversed back before being yielded. */
  53451 #define vmlal_laneq_s16(__p0_491, __p1_491, __p2_491, __p3_491) __extension__ ({ \
  53452   int32x4_t __ret_491; \
  53453   int32x4_t __s0_491 = __p0_491; \
  53454   int16x4_t __s1_491 = __p1_491; \
  53455   int16x8_t __s2_491 = __p2_491; \
  53456   int32x4_t __rev0_491;  __rev0_491 = __builtin_shufflevector(__s0_491, __s0_491, 3, 2, 1, 0); \
  53457   int16x4_t __rev1_491;  __rev1_491 = __builtin_shufflevector(__s1_491, __s1_491, 3, 2, 1, 0); \
  53458   int16x8_t __rev2_491;  __rev2_491 = __builtin_shufflevector(__s2_491, __s2_491, 7, 6, 5, 4, 3, 2, 1, 0); \
  53459   __ret_491 = __rev0_491 + __noswap_vmull_s16(__rev1_491, __noswap_splat_laneq_s16(__rev2_491, __p3_491)); \
  53460   __ret_491 = __builtin_shufflevector(__ret_491, __ret_491, 3, 2, 1, 0); \
  53461   __ret_491; \
  53462 })
  53463 #endif
  53464 
  53465 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_f64: returns __p0 - __p1 * __p2 computed with the vector operators
         * on float64x2_t values. */
  53466 __ai __attribute__((target("neon"))) float64x2_t vmlsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  53467   float64x2_t __ret;
  53468   __ret = __p0 - __p1 * __p2;
  53469   return __ret;
  53470 }
  53471 #else
        /* Big-endian variant: the two lanes of each argument are swapped with
         * __builtin_shufflevector, the same expression is evaluated on the swapped
         * values, and the result's lanes are swapped back before returning. */
  53472 __ai __attribute__((target("neon"))) float64x2_t vmlsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  53473   float64x2_t __ret;
  53474   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  53475   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  53476   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  53477   __ret = __rev0 - __rev1 * __rev2;
  53478   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  53479   return __ret;
  53480 }
  53481 #endif
  53482 
  53483 __ai __attribute__((target("neon"))) float64x1_t vmls_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) {
          /* Returns __p0 - __p1 * __p2 on float64x1_t values.  This definition is
           * not wrapped in an endianness #ifdef; no lane shuffling is performed. */
  53484   float64x1_t __ret;
  53485   __ret = __p0 - __p1 * __p2;
  53486   return __ret;
  53487 }
  53488 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_laneq_u32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the three uint32x4_t arguments into locals and yields
         *   __p0 - __p1 * splatq_laneq_u32(__p2, __p3)
         * as a uint32x4_t.  splatq_laneq_u32 is defined elsewhere. */
  53489 #define vmlsq_laneq_u32(__p0_492, __p1_492, __p2_492, __p3_492) __extension__ ({ \
  53490   uint32x4_t __ret_492; \
  53491   uint32x4_t __s0_492 = __p0_492; \
  53492   uint32x4_t __s1_492 = __p1_492; \
  53493   uint32x4_t __s2_492 = __p2_492; \
  53494   __ret_492 = __s0_492 - __s1_492 * splatq_laneq_u32(__s2_492, __p3_492); \
  53495   __ret_492; \
  53496 })
  53497 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splatq_laneq_u32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53498 #define vmlsq_laneq_u32(__p0_493, __p1_493, __p2_493, __p3_493) __extension__ ({ \
  53499   uint32x4_t __ret_493; \
  53500   uint32x4_t __s0_493 = __p0_493; \
  53501   uint32x4_t __s1_493 = __p1_493; \
  53502   uint32x4_t __s2_493 = __p2_493; \
  53503   uint32x4_t __rev0_493;  __rev0_493 = __builtin_shufflevector(__s0_493, __s0_493, 3, 2, 1, 0); \
  53504   uint32x4_t __rev1_493;  __rev1_493 = __builtin_shufflevector(__s1_493, __s1_493, 3, 2, 1, 0); \
  53505   uint32x4_t __rev2_493;  __rev2_493 = __builtin_shufflevector(__s2_493, __s2_493, 3, 2, 1, 0); \
  53506   __ret_493 = __rev0_493 - __rev1_493 * __noswap_splatq_laneq_u32(__rev2_493, __p3_493); \
  53507   __ret_493 = __builtin_shufflevector(__ret_493, __ret_493, 3, 2, 1, 0); \
  53508   __ret_493; \
  53509 })
  53510 #endif
  53511 
  53512 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_laneq_u16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the three uint16x8_t arguments into locals and yields
         *   __p0 - __p1 * splatq_laneq_u16(__p2, __p3)
         * as a uint16x8_t.  splatq_laneq_u16 is defined elsewhere. */
  53513 #define vmlsq_laneq_u16(__p0_494, __p1_494, __p2_494, __p3_494) __extension__ ({ \
  53514   uint16x8_t __ret_494; \
  53515   uint16x8_t __s0_494 = __p0_494; \
  53516   uint16x8_t __s1_494 = __p1_494; \
  53517   uint16x8_t __s2_494 = __p2_494; \
  53518   __ret_494 = __s0_494 - __s1_494 * splatq_laneq_u16(__s2_494, __p3_494); \
  53519   __ret_494; \
  53520 })
  53521 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splatq_laneq_u16 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53522 #define vmlsq_laneq_u16(__p0_495, __p1_495, __p2_495, __p3_495) __extension__ ({ \
  53523   uint16x8_t __ret_495; \
  53524   uint16x8_t __s0_495 = __p0_495; \
  53525   uint16x8_t __s1_495 = __p1_495; \
  53526   uint16x8_t __s2_495 = __p2_495; \
  53527   uint16x8_t __rev0_495;  __rev0_495 = __builtin_shufflevector(__s0_495, __s0_495, 7, 6, 5, 4, 3, 2, 1, 0); \
  53528   uint16x8_t __rev1_495;  __rev1_495 = __builtin_shufflevector(__s1_495, __s1_495, 7, 6, 5, 4, 3, 2, 1, 0); \
  53529   uint16x8_t __rev2_495;  __rev2_495 = __builtin_shufflevector(__s2_495, __s2_495, 7, 6, 5, 4, 3, 2, 1, 0); \
  53530   __ret_495 = __rev0_495 - __rev1_495 * __noswap_splatq_laneq_u16(__rev2_495, __p3_495); \
  53531   __ret_495 = __builtin_shufflevector(__ret_495, __ret_495, 7, 6, 5, 4, 3, 2, 1, 0); \
  53532   __ret_495; \
  53533 })
  53534 #endif
  53535 
  53536 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_laneq_f32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the three float32x4_t arguments into locals and yields
         *   __p0 - __p1 * splatq_laneq_f32(__p2, __p3)
         * as a float32x4_t.  splatq_laneq_f32 is defined elsewhere. */
  53537 #define vmlsq_laneq_f32(__p0_496, __p1_496, __p2_496, __p3_496) __extension__ ({ \
  53538   float32x4_t __ret_496; \
  53539   float32x4_t __s0_496 = __p0_496; \
  53540   float32x4_t __s1_496 = __p1_496; \
  53541   float32x4_t __s2_496 = __p2_496; \
  53542   __ret_496 = __s0_496 - __s1_496 * splatq_laneq_f32(__s2_496, __p3_496); \
  53543   __ret_496; \
  53544 })
  53545 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splatq_laneq_f32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53546 #define vmlsq_laneq_f32(__p0_497, __p1_497, __p2_497, __p3_497) __extension__ ({ \
  53547   float32x4_t __ret_497; \
  53548   float32x4_t __s0_497 = __p0_497; \
  53549   float32x4_t __s1_497 = __p1_497; \
  53550   float32x4_t __s2_497 = __p2_497; \
  53551   float32x4_t __rev0_497;  __rev0_497 = __builtin_shufflevector(__s0_497, __s0_497, 3, 2, 1, 0); \
  53552   float32x4_t __rev1_497;  __rev1_497 = __builtin_shufflevector(__s1_497, __s1_497, 3, 2, 1, 0); \
  53553   float32x4_t __rev2_497;  __rev2_497 = __builtin_shufflevector(__s2_497, __s2_497, 3, 2, 1, 0); \
  53554   __ret_497 = __rev0_497 - __rev1_497 * __noswap_splatq_laneq_f32(__rev2_497, __p3_497); \
  53555   __ret_497 = __builtin_shufflevector(__ret_497, __ret_497, 3, 2, 1, 0); \
  53556   __ret_497; \
  53557 })
  53558 #endif
  53559 
  53560 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_laneq_s32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the three int32x4_t arguments into locals and yields
         *   __p0 - __p1 * splatq_laneq_s32(__p2, __p3)
         * as an int32x4_t.  splatq_laneq_s32 is defined elsewhere. */
  53561 #define vmlsq_laneq_s32(__p0_498, __p1_498, __p2_498, __p3_498) __extension__ ({ \
  53562   int32x4_t __ret_498; \
  53563   int32x4_t __s0_498 = __p0_498; \
  53564   int32x4_t __s1_498 = __p1_498; \
  53565   int32x4_t __s2_498 = __p2_498; \
  53566   __ret_498 = __s0_498 - __s1_498 * splatq_laneq_s32(__s2_498, __p3_498); \
  53567   __ret_498; \
  53568 })
  53569 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splatq_laneq_s32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53570 #define vmlsq_laneq_s32(__p0_499, __p1_499, __p2_499, __p3_499) __extension__ ({ \
  53571   int32x4_t __ret_499; \
  53572   int32x4_t __s0_499 = __p0_499; \
  53573   int32x4_t __s1_499 = __p1_499; \
  53574   int32x4_t __s2_499 = __p2_499; \
  53575   int32x4_t __rev0_499;  __rev0_499 = __builtin_shufflevector(__s0_499, __s0_499, 3, 2, 1, 0); \
  53576   int32x4_t __rev1_499;  __rev1_499 = __builtin_shufflevector(__s1_499, __s1_499, 3, 2, 1, 0); \
  53577   int32x4_t __rev2_499;  __rev2_499 = __builtin_shufflevector(__s2_499, __s2_499, 3, 2, 1, 0); \
  53578   __ret_499 = __rev0_499 - __rev1_499 * __noswap_splatq_laneq_s32(__rev2_499, __p3_499); \
  53579   __ret_499 = __builtin_shufflevector(__ret_499, __ret_499, 3, 2, 1, 0); \
  53580   __ret_499; \
  53581 })
  53582 #endif
  53583 
  53584 #ifdef __LITTLE_ENDIAN__
        /* vmlsq_laneq_s16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the three int16x8_t arguments into locals and yields
         *   __p0 - __p1 * splatq_laneq_s16(__p2, __p3)
         * as an int16x8_t.  splatq_laneq_s16 is defined elsewhere. */
  53585 #define vmlsq_laneq_s16(__p0_500, __p1_500, __p2_500, __p3_500) __extension__ ({ \
  53586   int16x8_t __ret_500; \
  53587   int16x8_t __s0_500 = __p0_500; \
  53588   int16x8_t __s1_500 = __p1_500; \
  53589   int16x8_t __s2_500 = __p2_500; \
  53590   __ret_500 = __s0_500 - __s1_500 * splatq_laneq_s16(__s2_500, __p3_500); \
  53591   __ret_500; \
  53592 })
  53593 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splatq_laneq_s16 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53594 #define vmlsq_laneq_s16(__p0_501, __p1_501, __p2_501, __p3_501) __extension__ ({ \
  53595   int16x8_t __ret_501; \
  53596   int16x8_t __s0_501 = __p0_501; \
  53597   int16x8_t __s1_501 = __p1_501; \
  53598   int16x8_t __s2_501 = __p2_501; \
  53599   int16x8_t __rev0_501;  __rev0_501 = __builtin_shufflevector(__s0_501, __s0_501, 7, 6, 5, 4, 3, 2, 1, 0); \
  53600   int16x8_t __rev1_501;  __rev1_501 = __builtin_shufflevector(__s1_501, __s1_501, 7, 6, 5, 4, 3, 2, 1, 0); \
  53601   int16x8_t __rev2_501;  __rev2_501 = __builtin_shufflevector(__s2_501, __s2_501, 7, 6, 5, 4, 3, 2, 1, 0); \
  53602   __ret_501 = __rev0_501 - __rev1_501 * __noswap_splatq_laneq_s16(__rev2_501, __p3_501); \
  53603   __ret_501 = __builtin_shufflevector(__ret_501, __ret_501, 7, 6, 5, 4, 3, 2, 1, 0); \
  53604   __ret_501; \
  53605 })
  53606 #endif
  53607 
  53608 #ifdef __LITTLE_ENDIAN__
        /* vmls_laneq_u32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (uint32x2_t, uint32x2_t,
         * uint32x4_t) and yields
         *   __p0 - __p1 * splat_laneq_u32(__p2, __p3)
         * as a uint32x2_t.  splat_laneq_u32 is defined elsewhere. */
  53609 #define vmls_laneq_u32(__p0_502, __p1_502, __p2_502, __p3_502) __extension__ ({ \
  53610   uint32x2_t __ret_502; \
  53611   uint32x2_t __s0_502 = __p0_502; \
  53612   uint32x2_t __s1_502 = __p1_502; \
  53613   uint32x4_t __s2_502 = __p2_502; \
  53614   __ret_502 = __s0_502 - __s1_502 * splat_laneq_u32(__s2_502, __p3_502); \
  53615   __ret_502; \
  53616 })
  53617 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splat_laneq_u32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53618 #define vmls_laneq_u32(__p0_503, __p1_503, __p2_503, __p3_503) __extension__ ({ \
  53619   uint32x2_t __ret_503; \
  53620   uint32x2_t __s0_503 = __p0_503; \
  53621   uint32x2_t __s1_503 = __p1_503; \
  53622   uint32x4_t __s2_503 = __p2_503; \
  53623   uint32x2_t __rev0_503;  __rev0_503 = __builtin_shufflevector(__s0_503, __s0_503, 1, 0); \
  53624   uint32x2_t __rev1_503;  __rev1_503 = __builtin_shufflevector(__s1_503, __s1_503, 1, 0); \
  53625   uint32x4_t __rev2_503;  __rev2_503 = __builtin_shufflevector(__s2_503, __s2_503, 3, 2, 1, 0); \
  53626   __ret_503 = __rev0_503 - __rev1_503 * __noswap_splat_laneq_u32(__rev2_503, __p3_503); \
  53627   __ret_503 = __builtin_shufflevector(__ret_503, __ret_503, 1, 0); \
  53628   __ret_503; \
  53629 })
  53630 #endif
  53631 
  53632 #ifdef __LITTLE_ENDIAN__
        /* vmls_laneq_u16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (uint16x4_t, uint16x4_t,
         * uint16x8_t) and yields
         *   __p0 - __p1 * splat_laneq_u16(__p2, __p3)
         * as a uint16x4_t.  splat_laneq_u16 is defined elsewhere. */
  53633 #define vmls_laneq_u16(__p0_504, __p1_504, __p2_504, __p3_504) __extension__ ({ \
  53634   uint16x4_t __ret_504; \
  53635   uint16x4_t __s0_504 = __p0_504; \
  53636   uint16x4_t __s1_504 = __p1_504; \
  53637   uint16x8_t __s2_504 = __p2_504; \
  53638   __ret_504 = __s0_504 - __s1_504 * splat_laneq_u16(__s2_504, __p3_504); \
  53639   __ret_504; \
  53640 })
  53641 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splat_laneq_u16 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53642 #define vmls_laneq_u16(__p0_505, __p1_505, __p2_505, __p3_505) __extension__ ({ \
  53643   uint16x4_t __ret_505; \
  53644   uint16x4_t __s0_505 = __p0_505; \
  53645   uint16x4_t __s1_505 = __p1_505; \
  53646   uint16x8_t __s2_505 = __p2_505; \
  53647   uint16x4_t __rev0_505;  __rev0_505 = __builtin_shufflevector(__s0_505, __s0_505, 3, 2, 1, 0); \
  53648   uint16x4_t __rev1_505;  __rev1_505 = __builtin_shufflevector(__s1_505, __s1_505, 3, 2, 1, 0); \
  53649   uint16x8_t __rev2_505;  __rev2_505 = __builtin_shufflevector(__s2_505, __s2_505, 7, 6, 5, 4, 3, 2, 1, 0); \
  53650   __ret_505 = __rev0_505 - __rev1_505 * __noswap_splat_laneq_u16(__rev2_505, __p3_505); \
  53651   __ret_505 = __builtin_shufflevector(__ret_505, __ret_505, 3, 2, 1, 0); \
  53652   __ret_505; \
  53653 })
  53654 #endif
  53655 
  53656 #ifdef __LITTLE_ENDIAN__
        /* vmls_laneq_f32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (float32x2_t, float32x2_t,
         * float32x4_t) and yields
         *   __p0 - __p1 * splat_laneq_f32(__p2, __p3)
         * as a float32x2_t.  splat_laneq_f32 is defined elsewhere. */
  53657 #define vmls_laneq_f32(__p0_506, __p1_506, __p2_506, __p3_506) __extension__ ({ \
  53658   float32x2_t __ret_506; \
  53659   float32x2_t __s0_506 = __p0_506; \
  53660   float32x2_t __s1_506 = __p1_506; \
  53661   float32x4_t __s2_506 = __p2_506; \
  53662   __ret_506 = __s0_506 - __s1_506 * splat_laneq_f32(__s2_506, __p3_506); \
  53663   __ret_506; \
  53664 })
  53665 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splat_laneq_f32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53666 #define vmls_laneq_f32(__p0_507, __p1_507, __p2_507, __p3_507) __extension__ ({ \
  53667   float32x2_t __ret_507; \
  53668   float32x2_t __s0_507 = __p0_507; \
  53669   float32x2_t __s1_507 = __p1_507; \
  53670   float32x4_t __s2_507 = __p2_507; \
  53671   float32x2_t __rev0_507;  __rev0_507 = __builtin_shufflevector(__s0_507, __s0_507, 1, 0); \
  53672   float32x2_t __rev1_507;  __rev1_507 = __builtin_shufflevector(__s1_507, __s1_507, 1, 0); \
  53673   float32x4_t __rev2_507;  __rev2_507 = __builtin_shufflevector(__s2_507, __s2_507, 3, 2, 1, 0); \
  53674   __ret_507 = __rev0_507 - __rev1_507 * __noswap_splat_laneq_f32(__rev2_507, __p3_507); \
  53675   __ret_507 = __builtin_shufflevector(__ret_507, __ret_507, 1, 0); \
  53676   __ret_507; \
  53677 })
  53678 #endif
  53679 
  53680 #ifdef __LITTLE_ENDIAN__
        /* vmls_laneq_s32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int32x2_t, int32x2_t,
         * int32x4_t) and yields
         *   __p0 - __p1 * splat_laneq_s32(__p2, __p3)
         * as an int32x2_t.  splat_laneq_s32 is defined elsewhere. */
  53681 #define vmls_laneq_s32(__p0_508, __p1_508, __p2_508, __p3_508) __extension__ ({ \
  53682   int32x2_t __ret_508; \
  53683   int32x2_t __s0_508 = __p0_508; \
  53684   int32x2_t __s1_508 = __p1_508; \
  53685   int32x4_t __s2_508 = __p2_508; \
  53686   __ret_508 = __s0_508 - __s1_508 * splat_laneq_s32(__s2_508, __p3_508); \
  53687   __ret_508; \
  53688 })
  53689 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splat_laneq_s32 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53690 #define vmls_laneq_s32(__p0_509, __p1_509, __p2_509, __p3_509) __extension__ ({ \
  53691   int32x2_t __ret_509; \
  53692   int32x2_t __s0_509 = __p0_509; \
  53693   int32x2_t __s1_509 = __p1_509; \
  53694   int32x4_t __s2_509 = __p2_509; \
  53695   int32x2_t __rev0_509;  __rev0_509 = __builtin_shufflevector(__s0_509, __s0_509, 1, 0); \
  53696   int32x2_t __rev1_509;  __rev1_509 = __builtin_shufflevector(__s1_509, __s1_509, 1, 0); \
  53697   int32x4_t __rev2_509;  __rev2_509 = __builtin_shufflevector(__s2_509, __s2_509, 3, 2, 1, 0); \
  53698   __ret_509 = __rev0_509 - __rev1_509 * __noswap_splat_laneq_s32(__rev2_509, __p3_509); \
  53699   __ret_509 = __builtin_shufflevector(__ret_509, __ret_509, 1, 0); \
  53700   __ret_509; \
  53701 })
  53702 #endif
  53703 
  53704 #ifdef __LITTLE_ENDIAN__
        /* vmls_laneq_s16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int16x4_t, int16x4_t,
         * int16x8_t) and yields
         *   __p0 - __p1 * splat_laneq_s16(__p2, __p3)
         * as an int16x4_t.  splat_laneq_s16 is defined elsewhere. */
  53705 #define vmls_laneq_s16(__p0_510, __p1_510, __p2_510, __p3_510) __extension__ ({ \
  53706   int16x4_t __ret_510; \
  53707   int16x4_t __s0_510 = __p0_510; \
  53708   int16x4_t __s1_510 = __p1_510; \
  53709   int16x8_t __s2_510 = __p2_510; \
  53710   __ret_510 = __s0_510 - __s1_510 * splat_laneq_s16(__s2_510, __p3_510); \
  53711   __ret_510; \
  53712 })
  53713 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, __noswap_splat_laneq_s16 is applied to the
         * reversed vector, and the result is lane-reversed back before being
         * yielded. */
  53714 #define vmls_laneq_s16(__p0_511, __p1_511, __p2_511, __p3_511) __extension__ ({ \
  53715   int16x4_t __ret_511; \
  53716   int16x4_t __s0_511 = __p0_511; \
  53717   int16x4_t __s1_511 = __p1_511; \
  53718   int16x8_t __s2_511 = __p2_511; \
  53719   int16x4_t __rev0_511;  __rev0_511 = __builtin_shufflevector(__s0_511, __s0_511, 3, 2, 1, 0); \
  53720   int16x4_t __rev1_511;  __rev1_511 = __builtin_shufflevector(__s1_511, __s1_511, 3, 2, 1, 0); \
  53721   int16x8_t __rev2_511;  __rev2_511 = __builtin_shufflevector(__s2_511, __s2_511, 7, 6, 5, 4, 3, 2, 1, 0); \
  53722   __ret_511 = __rev0_511 - __rev1_511 * __noswap_splat_laneq_s16(__rev2_511, __p3_511); \
  53723   __ret_511 = __builtin_shufflevector(__ret_511, __ret_511, 3, 2, 1, 0); \
  53724   __ret_511; \
  53725 })
  53726 #endif
  53727 
  53728 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_lane_u32(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (uint64x2_t,
         * uint32x4_t, uint32x2_t) and yields
         *   __p0 - vmull_u32(vget_high_u32(__p1), splat_lane_u32(__p2, __p3))
         * as a uint64x2_t.  vmull_u32, vget_high_u32 and splat_lane_u32 are defined
         * elsewhere. */
  53729 #define vmlsl_high_lane_u32(__p0_512, __p1_512, __p2_512, __p3_512) __extension__ ({ \
  53730   uint64x2_t __ret_512; \
  53731   uint64x2_t __s0_512 = __p0_512; \
  53732   uint32x4_t __s1_512 = __p1_512; \
  53733   uint32x2_t __s2_512 = __p2_512; \
  53734   __ret_512 = __s0_512 - vmull_u32(vget_high_u32(__s1_512), splat_lane_u32(__s2_512, __p3_512)); \
  53735   __ret_512; \
  53736 })
  53737 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53738 #define vmlsl_high_lane_u32(__p0_513, __p1_513, __p2_513, __p3_513) __extension__ ({ \
  53739   uint64x2_t __ret_513; \
  53740   uint64x2_t __s0_513 = __p0_513; \
  53741   uint32x4_t __s1_513 = __p1_513; \
  53742   uint32x2_t __s2_513 = __p2_513; \
  53743   uint64x2_t __rev0_513;  __rev0_513 = __builtin_shufflevector(__s0_513, __s0_513, 1, 0); \
  53744   uint32x4_t __rev1_513;  __rev1_513 = __builtin_shufflevector(__s1_513, __s1_513, 3, 2, 1, 0); \
  53745   uint32x2_t __rev2_513;  __rev2_513 = __builtin_shufflevector(__s2_513, __s2_513, 1, 0); \
  53746   __ret_513 = __rev0_513 - __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_513), __noswap_splat_lane_u32(__rev2_513, __p3_513)); \
  53747   __ret_513 = __builtin_shufflevector(__ret_513, __ret_513, 1, 0); \
  53748   __ret_513; \
  53749 })
  53750 #endif
  53751 
  53752 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_lane_u16(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (uint32x4_t,
         * uint16x8_t, uint16x4_t) and yields
         *   __p0 - vmull_u16(vget_high_u16(__p1), splat_lane_u16(__p2, __p3))
         * as a uint32x4_t.  vmull_u16, vget_high_u16 and splat_lane_u16 are defined
         * elsewhere. */
  53753 #define vmlsl_high_lane_u16(__p0_514, __p1_514, __p2_514, __p3_514) __extension__ ({ \
  53754   uint32x4_t __ret_514; \
  53755   uint32x4_t __s0_514 = __p0_514; \
  53756   uint16x8_t __s1_514 = __p1_514; \
  53757   uint16x4_t __s2_514 = __p2_514; \
  53758   __ret_514 = __s0_514 - vmull_u16(vget_high_u16(__s1_514), splat_lane_u16(__s2_514, __p3_514)); \
  53759   __ret_514; \
  53760 })
  53761 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53762 #define vmlsl_high_lane_u16(__p0_515, __p1_515, __p2_515, __p3_515) __extension__ ({ \
  53763   uint32x4_t __ret_515; \
  53764   uint32x4_t __s0_515 = __p0_515; \
  53765   uint16x8_t __s1_515 = __p1_515; \
  53766   uint16x4_t __s2_515 = __p2_515; \
  53767   uint32x4_t __rev0_515;  __rev0_515 = __builtin_shufflevector(__s0_515, __s0_515, 3, 2, 1, 0); \
  53768   uint16x8_t __rev1_515;  __rev1_515 = __builtin_shufflevector(__s1_515, __s1_515, 7, 6, 5, 4, 3, 2, 1, 0); \
  53769   uint16x4_t __rev2_515;  __rev2_515 = __builtin_shufflevector(__s2_515, __s2_515, 3, 2, 1, 0); \
  53770   __ret_515 = __rev0_515 - __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_515), __noswap_splat_lane_u16(__rev2_515, __p3_515)); \
  53771   __ret_515 = __builtin_shufflevector(__ret_515, __ret_515, 3, 2, 1, 0); \
  53772   __ret_515; \
  53773 })
  53774 #endif
  53775 
  53776 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_lane_s32(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (int64x2_t, int32x4_t,
         * int32x2_t) and yields
         *   __p0 - vmull_s32(vget_high_s32(__p1), splat_lane_s32(__p2, __p3))
         * as an int64x2_t.  vmull_s32, vget_high_s32 and splat_lane_s32 are defined
         * elsewhere. */
  53777 #define vmlsl_high_lane_s32(__p0_516, __p1_516, __p2_516, __p3_516) __extension__ ({ \
  53778   int64x2_t __ret_516; \
  53779   int64x2_t __s0_516 = __p0_516; \
  53780   int32x4_t __s1_516 = __p1_516; \
  53781   int32x2_t __s2_516 = __p2_516; \
  53782   __ret_516 = __s0_516 - vmull_s32(vget_high_s32(__s1_516), splat_lane_s32(__s2_516, __p3_516)); \
  53783   __ret_516; \
  53784 })
  53785 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53786 #define vmlsl_high_lane_s32(__p0_517, __p1_517, __p2_517, __p3_517) __extension__ ({ \
  53787   int64x2_t __ret_517; \
  53788   int64x2_t __s0_517 = __p0_517; \
  53789   int32x4_t __s1_517 = __p1_517; \
  53790   int32x2_t __s2_517 = __p2_517; \
  53791   int64x2_t __rev0_517;  __rev0_517 = __builtin_shufflevector(__s0_517, __s0_517, 1, 0); \
  53792   int32x4_t __rev1_517;  __rev1_517 = __builtin_shufflevector(__s1_517, __s1_517, 3, 2, 1, 0); \
  53793   int32x2_t __rev2_517;  __rev2_517 = __builtin_shufflevector(__s2_517, __s2_517, 1, 0); \
  53794   __ret_517 = __rev0_517 - __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_517), __noswap_splat_lane_s32(__rev2_517, __p3_517)); \
  53795   __ret_517 = __builtin_shufflevector(__ret_517, __ret_517, 1, 0); \
  53796   __ret_517; \
  53797 })
  53798 #endif
  53799 
  53800 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_lane_s16(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (int32x4_t, int16x8_t,
         * int16x4_t) and yields
         *   __p0 - vmull_s16(vget_high_s16(__p1), splat_lane_s16(__p2, __p3))
         * as an int32x4_t.  vmull_s16, vget_high_s16 and splat_lane_s16 are defined
         * elsewhere. */
  53801 #define vmlsl_high_lane_s16(__p0_518, __p1_518, __p2_518, __p3_518) __extension__ ({ \
  53802   int32x4_t __ret_518; \
  53803   int32x4_t __s0_518 = __p0_518; \
  53804   int16x8_t __s1_518 = __p1_518; \
  53805   int16x4_t __s2_518 = __p2_518; \
  53806   __ret_518 = __s0_518 - vmull_s16(vget_high_s16(__s1_518), splat_lane_s16(__s2_518, __p3_518)); \
  53807   __ret_518; \
  53808 })
  53809 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53810 #define vmlsl_high_lane_s16(__p0_519, __p1_519, __p2_519, __p3_519) __extension__ ({ \
  53811   int32x4_t __ret_519; \
  53812   int32x4_t __s0_519 = __p0_519; \
  53813   int16x8_t __s1_519 = __p1_519; \
  53814   int16x4_t __s2_519 = __p2_519; \
  53815   int32x4_t __rev0_519;  __rev0_519 = __builtin_shufflevector(__s0_519, __s0_519, 3, 2, 1, 0); \
  53816   int16x8_t __rev1_519;  __rev1_519 = __builtin_shufflevector(__s1_519, __s1_519, 7, 6, 5, 4, 3, 2, 1, 0); \
  53817   int16x4_t __rev2_519;  __rev2_519 = __builtin_shufflevector(__s2_519, __s2_519, 3, 2, 1, 0); \
  53818   __ret_519 = __rev0_519 - __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_519), __noswap_splat_lane_s16(__rev2_519, __p3_519)); \
  53819   __ret_519 = __builtin_shufflevector(__ret_519, __ret_519, 3, 2, 1, 0); \
  53820   __ret_519; \
  53821 })
  53822 #endif
  53823 
  53824 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_laneq_u32(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (uint64x2_t,
         * uint32x4_t, uint32x4_t) and yields
         *   __p0 - vmull_u32(vget_high_u32(__p1), splat_laneq_u32(__p2, __p3))
         * as a uint64x2_t.  vmull_u32, vget_high_u32 and splat_laneq_u32 are
         * defined elsewhere. */
  53825 #define vmlsl_high_laneq_u32(__p0_520, __p1_520, __p2_520, __p3_520) __extension__ ({ \
  53826   uint64x2_t __ret_520; \
  53827   uint64x2_t __s0_520 = __p0_520; \
  53828   uint32x4_t __s1_520 = __p1_520; \
  53829   uint32x4_t __s2_520 = __p2_520; \
  53830   __ret_520 = __s0_520 - vmull_u32(vget_high_u32(__s1_520), splat_laneq_u32(__s2_520, __p3_520)); \
  53831   __ret_520; \
  53832 })
  53833 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53834 #define vmlsl_high_laneq_u32(__p0_521, __p1_521, __p2_521, __p3_521) __extension__ ({ \
  53835   uint64x2_t __ret_521; \
  53836   uint64x2_t __s0_521 = __p0_521; \
  53837   uint32x4_t __s1_521 = __p1_521; \
  53838   uint32x4_t __s2_521 = __p2_521; \
  53839   uint64x2_t __rev0_521;  __rev0_521 = __builtin_shufflevector(__s0_521, __s0_521, 1, 0); \
  53840   uint32x4_t __rev1_521;  __rev1_521 = __builtin_shufflevector(__s1_521, __s1_521, 3, 2, 1, 0); \
  53841   uint32x4_t __rev2_521;  __rev2_521 = __builtin_shufflevector(__s2_521, __s2_521, 3, 2, 1, 0); \
  53842   __ret_521 = __rev0_521 - __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_521), __noswap_splat_laneq_u32(__rev2_521, __p3_521)); \
  53843   __ret_521 = __builtin_shufflevector(__ret_521, __ret_521, 1, 0); \
  53844   __ret_521; \
  53845 })
  53846 #endif
  53847 
  53848 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_laneq_u16(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (uint32x4_t,
         * uint16x8_t, uint16x8_t) and yields
         *   __p0 - vmull_u16(vget_high_u16(__p1), splat_laneq_u16(__p2, __p3))
         * as a uint32x4_t.  vmull_u16, vget_high_u16 and splat_laneq_u16 are
         * defined elsewhere. */
  53849 #define vmlsl_high_laneq_u16(__p0_522, __p1_522, __p2_522, __p3_522) __extension__ ({ \
  53850   uint32x4_t __ret_522; \
  53851   uint32x4_t __s0_522 = __p0_522; \
  53852   uint16x8_t __s1_522 = __p1_522; \
  53853   uint16x8_t __s2_522 = __p2_522; \
  53854   __ret_522 = __s0_522 - vmull_u16(vget_high_u16(__s1_522), splat_laneq_u16(__s2_522, __p3_522)); \
  53855   __ret_522; \
  53856 })
  53857 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53858 #define vmlsl_high_laneq_u16(__p0_523, __p1_523, __p2_523, __p3_523) __extension__ ({ \
  53859   uint32x4_t __ret_523; \
  53860   uint32x4_t __s0_523 = __p0_523; \
  53861   uint16x8_t __s1_523 = __p1_523; \
  53862   uint16x8_t __s2_523 = __p2_523; \
  53863   uint32x4_t __rev0_523;  __rev0_523 = __builtin_shufflevector(__s0_523, __s0_523, 3, 2, 1, 0); \
  53864   uint16x8_t __rev1_523;  __rev1_523 = __builtin_shufflevector(__s1_523, __s1_523, 7, 6, 5, 4, 3, 2, 1, 0); \
  53865   uint16x8_t __rev2_523;  __rev2_523 = __builtin_shufflevector(__s2_523, __s2_523, 7, 6, 5, 4, 3, 2, 1, 0); \
  53866   __ret_523 = __rev0_523 - __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_523), __noswap_splat_laneq_u16(__rev2_523, __p3_523)); \
  53867   __ret_523 = __builtin_shufflevector(__ret_523, __ret_523, 3, 2, 1, 0); \
  53868   __ret_523; \
  53869 })
  53870 #endif
  53871 
  53872 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_laneq_s32(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (int64x2_t, int32x4_t,
         * int32x4_t) and yields
         *   __p0 - vmull_s32(vget_high_s32(__p1), splat_laneq_s32(__p2, __p3))
         * as an int64x2_t.  vmull_s32, vget_high_s32 and splat_laneq_s32 are
         * defined elsewhere. */
  53873 #define vmlsl_high_laneq_s32(__p0_524, __p1_524, __p2_524, __p3_524) __extension__ ({ \
  53874   int64x2_t __ret_524; \
  53875   int64x2_t __s0_524 = __p0_524; \
  53876   int32x4_t __s1_524 = __p1_524; \
  53877   int32x4_t __s2_524 = __p2_524; \
  53878   __ret_524 = __s0_524 - vmull_s32(vget_high_s32(__s1_524), splat_laneq_s32(__s2_524, __p3_524)); \
  53879   __ret_524; \
  53880 })
  53881 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53882 #define vmlsl_high_laneq_s32(__p0_525, __p1_525, __p2_525, __p3_525) __extension__ ({ \
  53883   int64x2_t __ret_525; \
  53884   int64x2_t __s0_525 = __p0_525; \
  53885   int32x4_t __s1_525 = __p1_525; \
  53886   int32x4_t __s2_525 = __p2_525; \
  53887   int64x2_t __rev0_525;  __rev0_525 = __builtin_shufflevector(__s0_525, __s0_525, 1, 0); \
  53888   int32x4_t __rev1_525;  __rev1_525 = __builtin_shufflevector(__s1_525, __s1_525, 3, 2, 1, 0); \
  53889   int32x4_t __rev2_525;  __rev2_525 = __builtin_shufflevector(__s2_525, __s2_525, 3, 2, 1, 0); \
  53890   __ret_525 = __rev0_525 - __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_525), __noswap_splat_laneq_s32(__rev2_525, __p3_525)); \
  53891   __ret_525 = __builtin_shufflevector(__ret_525, __ret_525, 1, 0); \
  53892   __ret_525; \
  53893 })
  53894 #endif
  53895 
  53896 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_high_laneq_s16(__p0, __p1, __p2, __p3): statement-expression macro
         * that copies the vector arguments into typed locals (int32x4_t, int16x8_t,
         * int16x8_t) and yields
         *   __p0 - vmull_s16(vget_high_s16(__p1), splat_laneq_s16(__p2, __p3))
         * as an int32x4_t.  vmull_s16, vget_high_s16 and splat_laneq_s16 are
         * defined elsewhere. */
  53897 #define vmlsl_high_laneq_s16(__p0_526, __p1_526, __p2_526, __p3_526) __extension__ ({ \
  53898   int32x4_t __ret_526; \
  53899   int32x4_t __s0_526 = __p0_526; \
  53900   int16x8_t __s1_526 = __p1_526; \
  53901   int16x8_t __s2_526 = __p2_526; \
  53902   __ret_526 = __s0_526 - vmull_s16(vget_high_s16(__s1_526), splat_laneq_s16(__s2_526, __p3_526)); \
  53903   __ret_526; \
  53904 })
  53905 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53906 #define vmlsl_high_laneq_s16(__p0_527, __p1_527, __p2_527, __p3_527) __extension__ ({ \
  53907   int32x4_t __ret_527; \
  53908   int32x4_t __s0_527 = __p0_527; \
  53909   int16x8_t __s1_527 = __p1_527; \
  53910   int16x8_t __s2_527 = __p2_527; \
  53911   int32x4_t __rev0_527;  __rev0_527 = __builtin_shufflevector(__s0_527, __s0_527, 3, 2, 1, 0); \
  53912   int16x8_t __rev1_527;  __rev1_527 = __builtin_shufflevector(__s1_527, __s1_527, 7, 6, 5, 4, 3, 2, 1, 0); \
  53913   int16x8_t __rev2_527;  __rev2_527 = __builtin_shufflevector(__s2_527, __s2_527, 7, 6, 5, 4, 3, 2, 1, 0); \
  53914   __ret_527 = __rev0_527 - __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_527), __noswap_splat_laneq_s16(__rev2_527, __p3_527)); \
  53915   __ret_527 = __builtin_shufflevector(__ret_527, __ret_527, 3, 2, 1, 0); \
  53916   __ret_527; \
  53917 })
  53918 #endif
  53919 
  53920 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_laneq_u32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (uint64x2_t, uint32x2_t,
         * uint32x4_t) and yields
         *   __p0 - vmull_u32(__p1, splat_laneq_u32(__p2, __p3))
         * as a uint64x2_t.  vmull_u32 and splat_laneq_u32 are defined elsewhere. */
  53921 #define vmlsl_laneq_u32(__p0_528, __p1_528, __p2_528, __p3_528) __extension__ ({ \
  53922   uint64x2_t __ret_528; \
  53923   uint64x2_t __s0_528 = __p0_528; \
  53924   uint32x2_t __s1_528 = __p1_528; \
  53925   uint32x4_t __s2_528 = __p2_528; \
  53926   __ret_528 = __s0_528 - vmull_u32(__s1_528, splat_laneq_u32(__s2_528, __p3_528)); \
  53927   __ret_528; \
  53928 })
  53929 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53930 #define vmlsl_laneq_u32(__p0_529, __p1_529, __p2_529, __p3_529) __extension__ ({ \
  53931   uint64x2_t __ret_529; \
  53932   uint64x2_t __s0_529 = __p0_529; \
  53933   uint32x2_t __s1_529 = __p1_529; \
  53934   uint32x4_t __s2_529 = __p2_529; \
  53935   uint64x2_t __rev0_529;  __rev0_529 = __builtin_shufflevector(__s0_529, __s0_529, 1, 0); \
  53936   uint32x2_t __rev1_529;  __rev1_529 = __builtin_shufflevector(__s1_529, __s1_529, 1, 0); \
  53937   uint32x4_t __rev2_529;  __rev2_529 = __builtin_shufflevector(__s2_529, __s2_529, 3, 2, 1, 0); \
  53938   __ret_529 = __rev0_529 - __noswap_vmull_u32(__rev1_529, __noswap_splat_laneq_u32(__rev2_529, __p3_529)); \
  53939   __ret_529 = __builtin_shufflevector(__ret_529, __ret_529, 1, 0); \
  53940   __ret_529; \
  53941 })
  53942 #endif
  53943 
  53944 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_laneq_u16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (uint32x4_t, uint16x4_t,
         * uint16x8_t) and yields
         *   __p0 - vmull_u16(__p1, splat_laneq_u16(__p2, __p3))
         * as a uint32x4_t.  vmull_u16 and splat_laneq_u16 are defined elsewhere. */
  53945 #define vmlsl_laneq_u16(__p0_530, __p1_530, __p2_530, __p3_530) __extension__ ({ \
  53946   uint32x4_t __ret_530; \
  53947   uint32x4_t __s0_530 = __p0_530; \
  53948   uint16x4_t __s1_530 = __p1_530; \
  53949   uint16x8_t __s2_530 = __p2_530; \
  53950   __ret_530 = __s0_530 - vmull_u16(__s1_530, splat_laneq_u16(__s2_530, __p3_530)); \
  53951   __ret_530; \
  53952 })
  53953 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53954 #define vmlsl_laneq_u16(__p0_531, __p1_531, __p2_531, __p3_531) __extension__ ({ \
  53955   uint32x4_t __ret_531; \
  53956   uint32x4_t __s0_531 = __p0_531; \
  53957   uint16x4_t __s1_531 = __p1_531; \
  53958   uint16x8_t __s2_531 = __p2_531; \
  53959   uint32x4_t __rev0_531;  __rev0_531 = __builtin_shufflevector(__s0_531, __s0_531, 3, 2, 1, 0); \
  53960   uint16x4_t __rev1_531;  __rev1_531 = __builtin_shufflevector(__s1_531, __s1_531, 3, 2, 1, 0); \
  53961   uint16x8_t __rev2_531;  __rev2_531 = __builtin_shufflevector(__s2_531, __s2_531, 7, 6, 5, 4, 3, 2, 1, 0); \
  53962   __ret_531 = __rev0_531 - __noswap_vmull_u16(__rev1_531, __noswap_splat_laneq_u16(__rev2_531, __p3_531)); \
  53963   __ret_531 = __builtin_shufflevector(__ret_531, __ret_531, 3, 2, 1, 0); \
  53964   __ret_531; \
  53965 })
  53966 #endif
  53967 
  53968 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_laneq_s32(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int64x2_t, int32x2_t,
         * int32x4_t) and yields
         *   __p0 - vmull_s32(__p1, splat_laneq_s32(__p2, __p3))
         * as an int64x2_t.  vmull_s32 and splat_laneq_s32 are defined elsewhere. */
  53969 #define vmlsl_laneq_s32(__p0_532, __p1_532, __p2_532, __p3_532) __extension__ ({ \
  53970   int64x2_t __ret_532; \
  53971   int64x2_t __s0_532 = __p0_532; \
  53972   int32x2_t __s1_532 = __p1_532; \
  53973   int32x4_t __s2_532 = __p2_532; \
  53974   __ret_532 = __s0_532 - vmull_s32(__s1_532, splat_laneq_s32(__s2_532, __p3_532)); \
  53975   __ret_532; \
  53976 })
  53977 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  53978 #define vmlsl_laneq_s32(__p0_533, __p1_533, __p2_533, __p3_533) __extension__ ({ \
  53979   int64x2_t __ret_533; \
  53980   int64x2_t __s0_533 = __p0_533; \
  53981   int32x2_t __s1_533 = __p1_533; \
  53982   int32x4_t __s2_533 = __p2_533; \
  53983   int64x2_t __rev0_533;  __rev0_533 = __builtin_shufflevector(__s0_533, __s0_533, 1, 0); \
  53984   int32x2_t __rev1_533;  __rev1_533 = __builtin_shufflevector(__s1_533, __s1_533, 1, 0); \
  53985   int32x4_t __rev2_533;  __rev2_533 = __builtin_shufflevector(__s2_533, __s2_533, 3, 2, 1, 0); \
  53986   __ret_533 = __rev0_533 - __noswap_vmull_s32(__rev1_533, __noswap_splat_laneq_s32(__rev2_533, __p3_533)); \
  53987   __ret_533 = __builtin_shufflevector(__ret_533, __ret_533, 1, 0); \
  53988   __ret_533; \
  53989 })
  53990 #endif
  53991 
  53992 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_laneq_s16(__p0, __p1, __p2, __p3): statement-expression macro that
         * copies the vector arguments into typed locals (int32x4_t, int16x4_t,
         * int16x8_t) and yields
         *   __p0 - vmull_s16(__p1, splat_laneq_s16(__p2, __p3))
         * as an int32x4_t.  vmull_s16 and splat_laneq_s16 are defined elsewhere. */
  53993 #define vmlsl_laneq_s16(__p0_534, __p1_534, __p2_534, __p3_534) __extension__ ({ \
  53994   int32x4_t __ret_534; \
  53995   int32x4_t __s0_534 = __p0_534; \
  53996   int16x4_t __s1_534 = __p1_534; \
  53997   int16x8_t __s2_534 = __p2_534; \
  53998   __ret_534 = __s0_534 - vmull_s16(__s1_534, splat_laneq_s16(__s2_534, __p3_534)); \
  53999   __ret_534; \
  54000 })
  54001 #else
        /* Big-endian variant: operands are lane-reversed with
         * __builtin_shufflevector, the __noswap_ helper forms are applied to the
         * reversed values, and the result is lane-reversed back before being
         * yielded. */
  54002 #define vmlsl_laneq_s16(__p0_535, __p1_535, __p2_535, __p3_535) __extension__ ({ \
  54003   int32x4_t __ret_535; \
  54004   int32x4_t __s0_535 = __p0_535; \
  54005   int16x4_t __s1_535 = __p1_535; \
  54006   int16x8_t __s2_535 = __p2_535; \
  54007   int32x4_t __rev0_535;  __rev0_535 = __builtin_shufflevector(__s0_535, __s0_535, 3, 2, 1, 0); \
  54008   int16x4_t __rev1_535;  __rev1_535 = __builtin_shufflevector(__s1_535, __s1_535, 3, 2, 1, 0); \
  54009   int16x8_t __rev2_535;  __rev2_535 = __builtin_shufflevector(__s2_535, __s2_535, 7, 6, 5, 4, 3, 2, 1, 0); \
  54010   __ret_535 = __rev0_535 - __noswap_vmull_s16(__rev1_535, __noswap_splat_laneq_s16(__rev2_535, __p3_535)); \
  54011   __ret_535 = __builtin_shufflevector(__ret_535, __ret_535, 3, 2, 1, 0); \
  54012   __ret_535; \
  54013 })
  54014 #endif
  54015 
  54016 __ai __attribute__((target("neon"))) poly64x1_t vmov_n_p64(poly64_t __p0) {
  54017   poly64x1_t __ret;
  54018   __ret = (poly64x1_t) {__p0};
  54019   return __ret;
  54020 }
  54021 #ifdef __LITTLE_ENDIAN__
  54022 __ai __attribute__((target("neon"))) poly64x2_t vmovq_n_p64(poly64_t __p0) {
  54023   poly64x2_t __ret;
  54024   __ret = (poly64x2_t) {__p0, __p0};
  54025   return __ret;
  54026 }
  54027 #else
  54028 __ai __attribute__((target("neon"))) poly64x2_t vmovq_n_p64(poly64_t __p0) {
  54029   poly64x2_t __ret;
  54030   __ret = (poly64x2_t) {__p0, __p0};
  54031   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54032   return __ret;
  54033 }
  54034 #endif
  54035 
  54036 #ifdef __LITTLE_ENDIAN__
  54037 __ai __attribute__((target("neon"))) float64x2_t vmovq_n_f64(float64_t __p0) {
  54038   float64x2_t __ret;
  54039   __ret = (float64x2_t) {__p0, __p0};
  54040   return __ret;
  54041 }
  54042 #else
  54043 __ai __attribute__((target("neon"))) float64x2_t vmovq_n_f64(float64_t __p0) {
  54044   float64x2_t __ret;
  54045   __ret = (float64x2_t) {__p0, __p0};
  54046   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54047   return __ret;
  54048 }
  54049 #endif
  54050 
  54051 __ai __attribute__((target("neon"))) float64x1_t vmov_n_f64(float64_t __p0) {
  54052   float64x1_t __ret;
  54053   __ret = (float64x1_t) {__p0};
  54054   return __ret;
  54055 }
  54056 #ifdef __LITTLE_ENDIAN__
  54057 __ai __attribute__((target("neon"))) uint16x8_t vmovl_high_u8(uint8x16_t __p0_536) {
  54058   uint16x8_t __ret_536;
  54059   uint8x8_t __a1_536 = vget_high_u8(__p0_536);
  54060   __ret_536 = (uint16x8_t)(vshll_n_u8(__a1_536, 0));
  54061   return __ret_536;
  54062 }
  54063 #else
  54064 __ai __attribute__((target("neon"))) uint16x8_t vmovl_high_u8(uint8x16_t __p0_537) {
  54065   uint16x8_t __ret_537;
  54066   uint8x16_t __rev0_537;  __rev0_537 = __builtin_shufflevector(__p0_537, __p0_537, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54067   uint8x8_t __a1_537 = __noswap_vget_high_u8(__rev0_537);
  54068   __ret_537 = (uint16x8_t)(__noswap_vshll_n_u8(__a1_537, 0));
  54069   __ret_537 = __builtin_shufflevector(__ret_537, __ret_537, 7, 6, 5, 4, 3, 2, 1, 0);
  54070   return __ret_537;
  54071 }
  54072 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmovl_high_u8(uint8x16_t __p0_538) {
  54073   uint16x8_t __ret_538;
  54074   uint8x8_t __a1_538 = __noswap_vget_high_u8(__p0_538);
  54075   __ret_538 = (uint16x8_t)(__noswap_vshll_n_u8(__a1_538, 0));
  54076   return __ret_538;
  54077 }
  54078 #endif
  54079 
  54080 #ifdef __LITTLE_ENDIAN__
  54081 __ai __attribute__((target("neon"))) uint64x2_t vmovl_high_u32(uint32x4_t __p0_539) {
  54082   uint64x2_t __ret_539;
  54083   uint32x2_t __a1_539 = vget_high_u32(__p0_539);
  54084   __ret_539 = (uint64x2_t)(vshll_n_u32(__a1_539, 0));
  54085   return __ret_539;
  54086 }
  54087 #else
  54088 __ai __attribute__((target("neon"))) uint64x2_t vmovl_high_u32(uint32x4_t __p0_540) {
  54089   uint64x2_t __ret_540;
  54090   uint32x4_t __rev0_540;  __rev0_540 = __builtin_shufflevector(__p0_540, __p0_540, 3, 2, 1, 0);
  54091   uint32x2_t __a1_540 = __noswap_vget_high_u32(__rev0_540);
  54092   __ret_540 = (uint64x2_t)(__noswap_vshll_n_u32(__a1_540, 0));
  54093   __ret_540 = __builtin_shufflevector(__ret_540, __ret_540, 1, 0);
  54094   return __ret_540;
  54095 }
  54096 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmovl_high_u32(uint32x4_t __p0_541) {
  54097   uint64x2_t __ret_541;
  54098   uint32x2_t __a1_541 = __noswap_vget_high_u32(__p0_541);
  54099   __ret_541 = (uint64x2_t)(__noswap_vshll_n_u32(__a1_541, 0));
  54100   return __ret_541;
  54101 }
  54102 #endif
  54103 
  54104 #ifdef __LITTLE_ENDIAN__
  54105 __ai __attribute__((target("neon"))) uint32x4_t vmovl_high_u16(uint16x8_t __p0_542) {
  54106   uint32x4_t __ret_542;
  54107   uint16x4_t __a1_542 = vget_high_u16(__p0_542);
  54108   __ret_542 = (uint32x4_t)(vshll_n_u16(__a1_542, 0));
  54109   return __ret_542;
  54110 }
  54111 #else
  54112 __ai __attribute__((target("neon"))) uint32x4_t vmovl_high_u16(uint16x8_t __p0_543) {
  54113   uint32x4_t __ret_543;
  54114   uint16x8_t __rev0_543;  __rev0_543 = __builtin_shufflevector(__p0_543, __p0_543, 7, 6, 5, 4, 3, 2, 1, 0);
  54115   uint16x4_t __a1_543 = __noswap_vget_high_u16(__rev0_543);
  54116   __ret_543 = (uint32x4_t)(__noswap_vshll_n_u16(__a1_543, 0));
  54117   __ret_543 = __builtin_shufflevector(__ret_543, __ret_543, 3, 2, 1, 0);
  54118   return __ret_543;
  54119 }
  54120 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmovl_high_u16(uint16x8_t __p0_544) {
  54121   uint32x4_t __ret_544;
  54122   uint16x4_t __a1_544 = __noswap_vget_high_u16(__p0_544);
  54123   __ret_544 = (uint32x4_t)(__noswap_vshll_n_u16(__a1_544, 0));
  54124   return __ret_544;
  54125 }
  54126 #endif
  54127 
  54128 #ifdef __LITTLE_ENDIAN__
  54129 __ai __attribute__((target("neon"))) int16x8_t vmovl_high_s8(int8x16_t __p0_545) {
  54130   int16x8_t __ret_545;
  54131   int8x8_t __a1_545 = vget_high_s8(__p0_545);
  54132   __ret_545 = (int16x8_t)(vshll_n_s8(__a1_545, 0));
  54133   return __ret_545;
  54134 }
  54135 #else
  54136 __ai __attribute__((target("neon"))) int16x8_t vmovl_high_s8(int8x16_t __p0_546) {
  54137   int16x8_t __ret_546;
  54138   int8x16_t __rev0_546;  __rev0_546 = __builtin_shufflevector(__p0_546, __p0_546, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54139   int8x8_t __a1_546 = __noswap_vget_high_s8(__rev0_546);
  54140   __ret_546 = (int16x8_t)(__noswap_vshll_n_s8(__a1_546, 0));
  54141   __ret_546 = __builtin_shufflevector(__ret_546, __ret_546, 7, 6, 5, 4, 3, 2, 1, 0);
  54142   return __ret_546;
  54143 }
  54144 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmovl_high_s8(int8x16_t __p0_547) {
  54145   int16x8_t __ret_547;
  54146   int8x8_t __a1_547 = __noswap_vget_high_s8(__p0_547);
  54147   __ret_547 = (int16x8_t)(__noswap_vshll_n_s8(__a1_547, 0));
  54148   return __ret_547;
  54149 }
  54150 #endif
  54151 
  54152 #ifdef __LITTLE_ENDIAN__
  54153 __ai __attribute__((target("neon"))) int64x2_t vmovl_high_s32(int32x4_t __p0_548) {
  54154   int64x2_t __ret_548;
  54155   int32x2_t __a1_548 = vget_high_s32(__p0_548);
  54156   __ret_548 = (int64x2_t)(vshll_n_s32(__a1_548, 0));
  54157   return __ret_548;
  54158 }
  54159 #else
  54160 __ai __attribute__((target("neon"))) int64x2_t vmovl_high_s32(int32x4_t __p0_549) {
  54161   int64x2_t __ret_549;
  54162   int32x4_t __rev0_549;  __rev0_549 = __builtin_shufflevector(__p0_549, __p0_549, 3, 2, 1, 0);
  54163   int32x2_t __a1_549 = __noswap_vget_high_s32(__rev0_549);
  54164   __ret_549 = (int64x2_t)(__noswap_vshll_n_s32(__a1_549, 0));
  54165   __ret_549 = __builtin_shufflevector(__ret_549, __ret_549, 1, 0);
  54166   return __ret_549;
  54167 }
  54168 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmovl_high_s32(int32x4_t __p0_550) {
  54169   int64x2_t __ret_550;
  54170   int32x2_t __a1_550 = __noswap_vget_high_s32(__p0_550);
  54171   __ret_550 = (int64x2_t)(__noswap_vshll_n_s32(__a1_550, 0));
  54172   return __ret_550;
  54173 }
  54174 #endif
  54175 
  54176 #ifdef __LITTLE_ENDIAN__
  54177 __ai __attribute__((target("neon"))) int32x4_t vmovl_high_s16(int16x8_t __p0_551) {
  54178   int32x4_t __ret_551;
  54179   int16x4_t __a1_551 = vget_high_s16(__p0_551);
  54180   __ret_551 = (int32x4_t)(vshll_n_s16(__a1_551, 0));
  54181   return __ret_551;
  54182 }
  54183 #else
  54184 __ai __attribute__((target("neon"))) int32x4_t vmovl_high_s16(int16x8_t __p0_552) {
  54185   int32x4_t __ret_552;
  54186   int16x8_t __rev0_552;  __rev0_552 = __builtin_shufflevector(__p0_552, __p0_552, 7, 6, 5, 4, 3, 2, 1, 0);
  54187   int16x4_t __a1_552 = __noswap_vget_high_s16(__rev0_552);
  54188   __ret_552 = (int32x4_t)(__noswap_vshll_n_s16(__a1_552, 0));
  54189   __ret_552 = __builtin_shufflevector(__ret_552, __ret_552, 3, 2, 1, 0);
  54190   return __ret_552;
  54191 }
  54192 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmovl_high_s16(int16x8_t __p0_553) {
  54193   int32x4_t __ret_553;
  54194   int16x4_t __a1_553 = __noswap_vget_high_s16(__p0_553);
  54195   __ret_553 = (int32x4_t)(__noswap_vshll_n_s16(__a1_553, 0));
  54196   return __ret_553;
  54197 }
  54198 #endif
  54199 
  54200 #ifdef __LITTLE_ENDIAN__
  54201 __ai __attribute__((target("neon"))) uint16x8_t vmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) {
  54202   uint16x8_t __ret;
  54203   __ret = vcombine_u16(__p0, vmovn_u32(__p1));
  54204   return __ret;
  54205 }
  54206 #else
  54207 __ai __attribute__((target("neon"))) uint16x8_t vmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) {
  54208   uint16x8_t __ret;
  54209   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  54210   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  54211   __ret = __noswap_vcombine_u16(__rev0, __noswap_vmovn_u32(__rev1));
  54212   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  54213   return __ret;
  54214 }
  54215 #endif
  54216 
  54217 #ifdef __LITTLE_ENDIAN__
  54218 __ai __attribute__((target("neon"))) uint32x4_t vmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) {
  54219   uint32x4_t __ret;
  54220   __ret = vcombine_u32(__p0, vmovn_u64(__p1));
  54221   return __ret;
  54222 }
  54223 #else
  54224 __ai __attribute__((target("neon"))) uint32x4_t vmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) {
  54225   uint32x4_t __ret;
  54226   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  54227   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  54228   __ret = __noswap_vcombine_u32(__rev0, __noswap_vmovn_u64(__rev1));
  54229   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  54230   return __ret;
  54231 }
  54232 #endif
  54233 
  54234 #ifdef __LITTLE_ENDIAN__
  54235 __ai __attribute__((target("neon"))) uint8x16_t vmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) {
  54236   uint8x16_t __ret;
  54237   __ret = vcombine_u8(__p0, vmovn_u16(__p1));
  54238   return __ret;
  54239 }
  54240 #else
  54241 __ai __attribute__((target("neon"))) uint8x16_t vmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) {
  54242   uint8x16_t __ret;
  54243   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  54244   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  54245   __ret = __noswap_vcombine_u8(__rev0, __noswap_vmovn_u16(__rev1));
  54246   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54247   return __ret;
  54248 }
  54249 #endif
  54250 
  54251 #ifdef __LITTLE_ENDIAN__
  54252 __ai __attribute__((target("neon"))) int16x8_t vmovn_high_s32(int16x4_t __p0, int32x4_t __p1) {
  54253   int16x8_t __ret;
  54254   __ret = vcombine_s16(__p0, vmovn_s32(__p1));
  54255   return __ret;
  54256 }
  54257 #else
  54258 __ai __attribute__((target("neon"))) int16x8_t vmovn_high_s32(int16x4_t __p0, int32x4_t __p1) {
  54259   int16x8_t __ret;
  54260   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  54261   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  54262   __ret = __noswap_vcombine_s16(__rev0, __noswap_vmovn_s32(__rev1));
  54263   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  54264   return __ret;
  54265 }
  54266 #endif
  54267 
  54268 #ifdef __LITTLE_ENDIAN__
  54269 __ai __attribute__((target("neon"))) int32x4_t vmovn_high_s64(int32x2_t __p0, int64x2_t __p1) {
  54270   int32x4_t __ret;
  54271   __ret = vcombine_s32(__p0, vmovn_s64(__p1));
  54272   return __ret;
  54273 }
  54274 #else
  54275 __ai __attribute__((target("neon"))) int32x4_t vmovn_high_s64(int32x2_t __p0, int64x2_t __p1) {
  54276   int32x4_t __ret;
  54277   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  54278   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  54279   __ret = __noswap_vcombine_s32(__rev0, __noswap_vmovn_s64(__rev1));
  54280   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  54281   return __ret;
  54282 }
  54283 #endif
  54284 
  54285 #ifdef __LITTLE_ENDIAN__
  54286 __ai __attribute__((target("neon"))) int8x16_t vmovn_high_s16(int8x8_t __p0, int16x8_t __p1) {
  54287   int8x16_t __ret;
  54288   __ret = vcombine_s8(__p0, vmovn_s16(__p1));
  54289   return __ret;
  54290 }
  54291 #else
  54292 __ai __attribute__((target("neon"))) int8x16_t vmovn_high_s16(int8x8_t __p0, int16x8_t __p1) {
  54293   int8x16_t __ret;
  54294   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  54295   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  54296   __ret = __noswap_vcombine_s8(__rev0, __noswap_vmovn_s16(__rev1));
  54297   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54298   return __ret;
  54299 }
  54300 #endif
  54301 
  54302 #ifdef __LITTLE_ENDIAN__
  54303 __ai __attribute__((target("neon"))) float64x2_t vmulq_f64(float64x2_t __p0, float64x2_t __p1) {
  54304   float64x2_t __ret;
  54305   __ret = __p0 * __p1;
  54306   return __ret;
  54307 }
  54308 #else
  54309 __ai __attribute__((target("neon"))) float64x2_t vmulq_f64(float64x2_t __p0, float64x2_t __p1) {
  54310   float64x2_t __ret;
  54311   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  54312   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  54313   __ret = __rev0 * __rev1;
  54314   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54315   return __ret;
  54316 }
  54317 #endif
  54318 
  54319 __ai __attribute__((target("neon"))) float64x1_t vmul_f64(float64x1_t __p0, float64x1_t __p1) {
  54320   float64x1_t __ret;
  54321   __ret = __p0 * __p1;
  54322   return __ret;
  54323 }
  54324 #define vmuld_lane_f64(__p0_554, __p1_554, __p2_554) __extension__ ({ \
  54325   float64_t __ret_554; \
  54326   float64_t __s0_554 = __p0_554; \
  54327   float64x1_t __s1_554 = __p1_554; \
  54328   __ret_554 = __s0_554 * vget_lane_f64(__s1_554, __p2_554); \
  54329   __ret_554; \
  54330 })
  54331 #ifdef __LITTLE_ENDIAN__
  54332 #define vmuls_lane_f32(__p0_555, __p1_555, __p2_555) __extension__ ({ \
  54333   float32_t __ret_555; \
  54334   float32_t __s0_555 = __p0_555; \
  54335   float32x2_t __s1_555 = __p1_555; \
  54336   __ret_555 = __s0_555 * vget_lane_f32(__s1_555, __p2_555); \
  54337   __ret_555; \
  54338 })
  54339 #else
  54340 #define vmuls_lane_f32(__p0_556, __p1_556, __p2_556) __extension__ ({ \
  54341   float32_t __ret_556; \
  54342   float32_t __s0_556 = __p0_556; \
  54343   float32x2_t __s1_556 = __p1_556; \
  54344   float32x2_t __rev1_556;  __rev1_556 = __builtin_shufflevector(__s1_556, __s1_556, 1, 0); \
  54345   __ret_556 = __s0_556 * __noswap_vget_lane_f32(__rev1_556, __p2_556); \
  54346   __ret_556; \
  54347 })
  54348 #endif
  54349 
  54350 #define vmul_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  54351   float64x1_t __ret; \
  54352   float64x1_t __s0 = __p0; \
  54353   float64x1_t __s1 = __p1; \
  54354   __ret = (float64x1_t) __builtin_neon_vmul_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 10); \
  54355   __ret; \
  54356 })
  54357 #ifdef __LITTLE_ENDIAN__
  54358 #define vmulq_lane_f64(__p0_557, __p1_557, __p2_557) __extension__ ({ \
  54359   float64x2_t __ret_557; \
  54360   float64x2_t __s0_557 = __p0_557; \
  54361   float64x1_t __s1_557 = __p1_557; \
  54362   __ret_557 = __s0_557 * splatq_lane_f64(__s1_557, __p2_557); \
  54363   __ret_557; \
  54364 })
  54365 #else
  54366 #define vmulq_lane_f64(__p0_558, __p1_558, __p2_558) __extension__ ({ \
  54367   float64x2_t __ret_558; \
  54368   float64x2_t __s0_558 = __p0_558; \
  54369   float64x1_t __s1_558 = __p1_558; \
  54370   float64x2_t __rev0_558;  __rev0_558 = __builtin_shufflevector(__s0_558, __s0_558, 1, 0); \
  54371   __ret_558 = __rev0_558 * __noswap_splatq_lane_f64(__s1_558, __p2_558); \
  54372   __ret_558 = __builtin_shufflevector(__ret_558, __ret_558, 1, 0); \
  54373   __ret_558; \
  54374 })
  54375 #endif
  54376 
  54377 #ifdef __LITTLE_ENDIAN__
  54378 #define vmuld_laneq_f64(__p0_559, __p1_559, __p2_559) __extension__ ({ \
  54379   float64_t __ret_559; \
  54380   float64_t __s0_559 = __p0_559; \
  54381   float64x2_t __s1_559 = __p1_559; \
  54382   __ret_559 = __s0_559 * vgetq_lane_f64(__s1_559, __p2_559); \
  54383   __ret_559; \
  54384 })
  54385 #else
  54386 #define vmuld_laneq_f64(__p0_560, __p1_560, __p2_560) __extension__ ({ \
  54387   float64_t __ret_560; \
  54388   float64_t __s0_560 = __p0_560; \
  54389   float64x2_t __s1_560 = __p1_560; \
  54390   float64x2_t __rev1_560;  __rev1_560 = __builtin_shufflevector(__s1_560, __s1_560, 1, 0); \
  54391   __ret_560 = __s0_560 * __noswap_vgetq_lane_f64(__rev1_560, __p2_560); \
  54392   __ret_560; \
  54393 })
  54394 #endif
  54395 
  54396 #ifdef __LITTLE_ENDIAN__
  54397 #define vmuls_laneq_f32(__p0_561, __p1_561, __p2_561) __extension__ ({ \
  54398   float32_t __ret_561; \
  54399   float32_t __s0_561 = __p0_561; \
  54400   float32x4_t __s1_561 = __p1_561; \
  54401   __ret_561 = __s0_561 * vgetq_lane_f32(__s1_561, __p2_561); \
  54402   __ret_561; \
  54403 })
  54404 #else
  54405 #define vmuls_laneq_f32(__p0_562, __p1_562, __p2_562) __extension__ ({ \
  54406   float32_t __ret_562; \
  54407   float32_t __s0_562 = __p0_562; \
  54408   float32x4_t __s1_562 = __p1_562; \
  54409   float32x4_t __rev1_562;  __rev1_562 = __builtin_shufflevector(__s1_562, __s1_562, 3, 2, 1, 0); \
  54410   __ret_562 = __s0_562 * __noswap_vgetq_lane_f32(__rev1_562, __p2_562); \
  54411   __ret_562; \
  54412 })
  54413 #endif
  54414 
  54415 #ifdef __LITTLE_ENDIAN__
  54416 #define vmul_laneq_f64(__p0, __p1, __p2) __extension__ ({ \
  54417   float64x1_t __ret; \
  54418   float64x1_t __s0 = __p0; \
  54419   float64x2_t __s1 = __p1; \
  54420   __ret = (float64x1_t) __builtin_neon_vmul_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 10); \
  54421   __ret; \
  54422 })
  54423 #else
  54424 #define vmul_laneq_f64(__p0, __p1, __p2) __extension__ ({ \
  54425   float64x1_t __ret; \
  54426   float64x1_t __s0 = __p0; \
  54427   float64x2_t __s1 = __p1; \
  54428   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  54429   __ret = (float64x1_t) __builtin_neon_vmul_laneq_v((int8x8_t)__s0, (int8x16_t)__rev1, __p2, 10); \
  54430   __ret; \
  54431 })
  54432 #endif
  54433 
  54434 #ifdef __LITTLE_ENDIAN__
  54435 #define vmulq_laneq_u32(__p0_563, __p1_563, __p2_563) __extension__ ({ \
  54436   uint32x4_t __ret_563; \
  54437   uint32x4_t __s0_563 = __p0_563; \
  54438   uint32x4_t __s1_563 = __p1_563; \
  54439   __ret_563 = __s0_563 * splatq_laneq_u32(__s1_563, __p2_563); \
  54440   __ret_563; \
  54441 })
  54442 #else
  54443 #define vmulq_laneq_u32(__p0_564, __p1_564, __p2_564) __extension__ ({ \
  54444   uint32x4_t __ret_564; \
  54445   uint32x4_t __s0_564 = __p0_564; \
  54446   uint32x4_t __s1_564 = __p1_564; \
  54447   uint32x4_t __rev0_564;  __rev0_564 = __builtin_shufflevector(__s0_564, __s0_564, 3, 2, 1, 0); \
  54448   uint32x4_t __rev1_564;  __rev1_564 = __builtin_shufflevector(__s1_564, __s1_564, 3, 2, 1, 0); \
  54449   __ret_564 = __rev0_564 * __noswap_splatq_laneq_u32(__rev1_564, __p2_564); \
  54450   __ret_564 = __builtin_shufflevector(__ret_564, __ret_564, 3, 2, 1, 0); \
  54451   __ret_564; \
  54452 })
  54453 #endif
  54454 
  54455 #ifdef __LITTLE_ENDIAN__
  54456 #define vmulq_laneq_u16(__p0_565, __p1_565, __p2_565) __extension__ ({ \
  54457   uint16x8_t __ret_565; \
  54458   uint16x8_t __s0_565 = __p0_565; \
  54459   uint16x8_t __s1_565 = __p1_565; \
  54460   __ret_565 = __s0_565 * splatq_laneq_u16(__s1_565, __p2_565); \
  54461   __ret_565; \
  54462 })
  54463 #else
  54464 #define vmulq_laneq_u16(__p0_566, __p1_566, __p2_566) __extension__ ({ \
  54465   uint16x8_t __ret_566; \
  54466   uint16x8_t __s0_566 = __p0_566; \
  54467   uint16x8_t __s1_566 = __p1_566; \
  54468   uint16x8_t __rev0_566;  __rev0_566 = __builtin_shufflevector(__s0_566, __s0_566, 7, 6, 5, 4, 3, 2, 1, 0); \
  54469   uint16x8_t __rev1_566;  __rev1_566 = __builtin_shufflevector(__s1_566, __s1_566, 7, 6, 5, 4, 3, 2, 1, 0); \
  54470   __ret_566 = __rev0_566 * __noswap_splatq_laneq_u16(__rev1_566, __p2_566); \
  54471   __ret_566 = __builtin_shufflevector(__ret_566, __ret_566, 7, 6, 5, 4, 3, 2, 1, 0); \
  54472   __ret_566; \
  54473 })
  54474 #endif
  54475 
  54476 #ifdef __LITTLE_ENDIAN__
  54477 #define vmulq_laneq_f64(__p0_567, __p1_567, __p2_567) __extension__ ({ \
  54478   float64x2_t __ret_567; \
  54479   float64x2_t __s0_567 = __p0_567; \
  54480   float64x2_t __s1_567 = __p1_567; \
  54481   __ret_567 = __s0_567 * splatq_laneq_f64(__s1_567, __p2_567); \
  54482   __ret_567; \
  54483 })
  54484 #else
  54485 #define vmulq_laneq_f64(__p0_568, __p1_568, __p2_568) __extension__ ({ \
  54486   float64x2_t __ret_568; \
  54487   float64x2_t __s0_568 = __p0_568; \
  54488   float64x2_t __s1_568 = __p1_568; \
  54489   float64x2_t __rev0_568;  __rev0_568 = __builtin_shufflevector(__s0_568, __s0_568, 1, 0); \
  54490   float64x2_t __rev1_568;  __rev1_568 = __builtin_shufflevector(__s1_568, __s1_568, 1, 0); \
  54491   __ret_568 = __rev0_568 * __noswap_splatq_laneq_f64(__rev1_568, __p2_568); \
  54492   __ret_568 = __builtin_shufflevector(__ret_568, __ret_568, 1, 0); \
  54493   __ret_568; \
  54494 })
  54495 #endif
  54496 
  54497 #ifdef __LITTLE_ENDIAN__
  54498 #define vmulq_laneq_f32(__p0_569, __p1_569, __p2_569) __extension__ ({ \
  54499   float32x4_t __ret_569; \
  54500   float32x4_t __s0_569 = __p0_569; \
  54501   float32x4_t __s1_569 = __p1_569; \
  54502   __ret_569 = __s0_569 * splatq_laneq_f32(__s1_569, __p2_569); \
  54503   __ret_569; \
  54504 })
  54505 #else
  54506 #define vmulq_laneq_f32(__p0_570, __p1_570, __p2_570) __extension__ ({ \
  54507   float32x4_t __ret_570; \
  54508   float32x4_t __s0_570 = __p0_570; \
  54509   float32x4_t __s1_570 = __p1_570; \
  54510   float32x4_t __rev0_570;  __rev0_570 = __builtin_shufflevector(__s0_570, __s0_570, 3, 2, 1, 0); \
  54511   float32x4_t __rev1_570;  __rev1_570 = __builtin_shufflevector(__s1_570, __s1_570, 3, 2, 1, 0); \
  54512   __ret_570 = __rev0_570 * __noswap_splatq_laneq_f32(__rev1_570, __p2_570); \
  54513   __ret_570 = __builtin_shufflevector(__ret_570, __ret_570, 3, 2, 1, 0); \
  54514   __ret_570; \
  54515 })
  54516 #endif
  54517 
  54518 #ifdef __LITTLE_ENDIAN__
  54519 #define vmulq_laneq_s32(__p0_571, __p1_571, __p2_571) __extension__ ({ \
  54520   int32x4_t __ret_571; \
  54521   int32x4_t __s0_571 = __p0_571; \
  54522   int32x4_t __s1_571 = __p1_571; \
  54523   __ret_571 = __s0_571 * splatq_laneq_s32(__s1_571, __p2_571); \
  54524   __ret_571; \
  54525 })
  54526 #else
  54527 #define vmulq_laneq_s32(__p0_572, __p1_572, __p2_572) __extension__ ({ \
  54528   int32x4_t __ret_572; \
  54529   int32x4_t __s0_572 = __p0_572; \
  54530   int32x4_t __s1_572 = __p1_572; \
  54531   int32x4_t __rev0_572;  __rev0_572 = __builtin_shufflevector(__s0_572, __s0_572, 3, 2, 1, 0); \
  54532   int32x4_t __rev1_572;  __rev1_572 = __builtin_shufflevector(__s1_572, __s1_572, 3, 2, 1, 0); \
  54533   __ret_572 = __rev0_572 * __noswap_splatq_laneq_s32(__rev1_572, __p2_572); \
  54534   __ret_572 = __builtin_shufflevector(__ret_572, __ret_572, 3, 2, 1, 0); \
  54535   __ret_572; \
  54536 })
  54537 #endif
  54538 
  54539 #ifdef __LITTLE_ENDIAN__
  54540 #define vmulq_laneq_s16(__p0_573, __p1_573, __p2_573) __extension__ ({ \
  54541   int16x8_t __ret_573; \
  54542   int16x8_t __s0_573 = __p0_573; \
  54543   int16x8_t __s1_573 = __p1_573; \
  54544   __ret_573 = __s0_573 * splatq_laneq_s16(__s1_573, __p2_573); \
  54545   __ret_573; \
  54546 })
  54547 #else
  54548 #define vmulq_laneq_s16(__p0_574, __p1_574, __p2_574) __extension__ ({ \
  54549   int16x8_t __ret_574; \
  54550   int16x8_t __s0_574 = __p0_574; \
  54551   int16x8_t __s1_574 = __p1_574; \
  54552   int16x8_t __rev0_574;  __rev0_574 = __builtin_shufflevector(__s0_574, __s0_574, 7, 6, 5, 4, 3, 2, 1, 0); \
  54553   int16x8_t __rev1_574;  __rev1_574 = __builtin_shufflevector(__s1_574, __s1_574, 7, 6, 5, 4, 3, 2, 1, 0); \
  54554   __ret_574 = __rev0_574 * __noswap_splatq_laneq_s16(__rev1_574, __p2_574); \
  54555   __ret_574 = __builtin_shufflevector(__ret_574, __ret_574, 7, 6, 5, 4, 3, 2, 1, 0); \
  54556   __ret_574; \
  54557 })
  54558 #endif
  54559 
  54560 #ifdef __LITTLE_ENDIAN__
  54561 #define vmul_laneq_u32(__p0_575, __p1_575, __p2_575) __extension__ ({ \
  54562   uint32x2_t __ret_575; \
  54563   uint32x2_t __s0_575 = __p0_575; \
  54564   uint32x4_t __s1_575 = __p1_575; \
  54565   __ret_575 = __s0_575 * splat_laneq_u32(__s1_575, __p2_575); \
  54566   __ret_575; \
  54567 })
  54568 #else
  54569 #define vmul_laneq_u32(__p0_576, __p1_576, __p2_576) __extension__ ({ \
  54570   uint32x2_t __ret_576; \
  54571   uint32x2_t __s0_576 = __p0_576; \
  54572   uint32x4_t __s1_576 = __p1_576; \
  54573   uint32x2_t __rev0_576;  __rev0_576 = __builtin_shufflevector(__s0_576, __s0_576, 1, 0); \
  54574   uint32x4_t __rev1_576;  __rev1_576 = __builtin_shufflevector(__s1_576, __s1_576, 3, 2, 1, 0); \
  54575   __ret_576 = __rev0_576 * __noswap_splat_laneq_u32(__rev1_576, __p2_576); \
  54576   __ret_576 = __builtin_shufflevector(__ret_576, __ret_576, 1, 0); \
  54577   __ret_576; \
  54578 })
  54579 #endif
  54580 
  54581 #ifdef __LITTLE_ENDIAN__
  54582 #define vmul_laneq_u16(__p0_577, __p1_577, __p2_577) __extension__ ({ \
  54583   uint16x4_t __ret_577; \
  54584   uint16x4_t __s0_577 = __p0_577; \
  54585   uint16x8_t __s1_577 = __p1_577; \
  54586   __ret_577 = __s0_577 * splat_laneq_u16(__s1_577, __p2_577); \
  54587   __ret_577; \
  54588 })
  54589 #else
  54590 #define vmul_laneq_u16(__p0_578, __p1_578, __p2_578) __extension__ ({ \
  54591   uint16x4_t __ret_578; \
  54592   uint16x4_t __s0_578 = __p0_578; \
  54593   uint16x8_t __s1_578 = __p1_578; \
  54594   uint16x4_t __rev0_578;  __rev0_578 = __builtin_shufflevector(__s0_578, __s0_578, 3, 2, 1, 0); \
  54595   uint16x8_t __rev1_578;  __rev1_578 = __builtin_shufflevector(__s1_578, __s1_578, 7, 6, 5, 4, 3, 2, 1, 0); \
  54596   __ret_578 = __rev0_578 * __noswap_splat_laneq_u16(__rev1_578, __p2_578); \
  54597   __ret_578 = __builtin_shufflevector(__ret_578, __ret_578, 3, 2, 1, 0); \
  54598   __ret_578; \
  54599 })
  54600 #endif
  54601 
  54602 #ifdef __LITTLE_ENDIAN__
  54603 #define vmul_laneq_f32(__p0_579, __p1_579, __p2_579) __extension__ ({ \
  54604   float32x2_t __ret_579; \
  54605   float32x2_t __s0_579 = __p0_579; \
  54606   float32x4_t __s1_579 = __p1_579; \
  54607   __ret_579 = __s0_579 * splat_laneq_f32(__s1_579, __p2_579); \
  54608   __ret_579; \
  54609 })
  54610 #else
  54611 #define vmul_laneq_f32(__p0_580, __p1_580, __p2_580) __extension__ ({ \
  54612   float32x2_t __ret_580; \
  54613   float32x2_t __s0_580 = __p0_580; \
  54614   float32x4_t __s1_580 = __p1_580; \
  54615   float32x2_t __rev0_580;  __rev0_580 = __builtin_shufflevector(__s0_580, __s0_580, 1, 0); \
  54616   float32x4_t __rev1_580;  __rev1_580 = __builtin_shufflevector(__s1_580, __s1_580, 3, 2, 1, 0); \
  54617   __ret_580 = __rev0_580 * __noswap_splat_laneq_f32(__rev1_580, __p2_580); \
  54618   __ret_580 = __builtin_shufflevector(__ret_580, __ret_580, 1, 0); \
  54619   __ret_580; \
  54620 })
  54621 #endif
  54622 
  54623 #ifdef __LITTLE_ENDIAN__
  54624 #define vmul_laneq_s32(__p0_581, __p1_581, __p2_581) __extension__ ({ \
  54625   int32x2_t __ret_581; \
  54626   int32x2_t __s0_581 = __p0_581; \
  54627   int32x4_t __s1_581 = __p1_581; \
  54628   __ret_581 = __s0_581 * splat_laneq_s32(__s1_581, __p2_581); \
  54629   __ret_581; \
  54630 })
  54631 #else
  54632 #define vmul_laneq_s32(__p0_582, __p1_582, __p2_582) __extension__ ({ \
  54633   int32x2_t __ret_582; \
  54634   int32x2_t __s0_582 = __p0_582; \
  54635   int32x4_t __s1_582 = __p1_582; \
  54636   int32x2_t __rev0_582;  __rev0_582 = __builtin_shufflevector(__s0_582, __s0_582, 1, 0); \
  54637   int32x4_t __rev1_582;  __rev1_582 = __builtin_shufflevector(__s1_582, __s1_582, 3, 2, 1, 0); \
  54638   __ret_582 = __rev0_582 * __noswap_splat_laneq_s32(__rev1_582, __p2_582); \
  54639   __ret_582 = __builtin_shufflevector(__ret_582, __ret_582, 1, 0); \
  54640   __ret_582; \
  54641 })
  54642 #endif
  54643 
  54644 #ifdef __LITTLE_ENDIAN__
  54645 #define vmul_laneq_s16(__p0_583, __p1_583, __p2_583) __extension__ ({ \
  54646   int16x4_t __ret_583; \
  54647   int16x4_t __s0_583 = __p0_583; \
  54648   int16x8_t __s1_583 = __p1_583; \
  54649   __ret_583 = __s0_583 * splat_laneq_s16(__s1_583, __p2_583); \
  54650   __ret_583; \
  54651 })
  54652 #else
  54653 #define vmul_laneq_s16(__p0_584, __p1_584, __p2_584) __extension__ ({ \
  54654   int16x4_t __ret_584; \
  54655   int16x4_t __s0_584 = __p0_584; \
  54656   int16x8_t __s1_584 = __p1_584; \
  54657   int16x4_t __rev0_584;  __rev0_584 = __builtin_shufflevector(__s0_584, __s0_584, 3, 2, 1, 0); \
  54658   int16x8_t __rev1_584;  __rev1_584 = __builtin_shufflevector(__s1_584, __s1_584, 7, 6, 5, 4, 3, 2, 1, 0); \
  54659   __ret_584 = __rev0_584 * __noswap_splat_laneq_s16(__rev1_584, __p2_584); \
  54660   __ret_584 = __builtin_shufflevector(__ret_584, __ret_584, 3, 2, 1, 0); \
  54661   __ret_584; \
  54662 })
  54663 #endif
  54664 
  54665 __ai __attribute__((target("neon"))) float64x1_t vmul_n_f64(float64x1_t __p0, float64_t __p1) {
  54666   float64x1_t __ret;
  54667   __ret = (float64x1_t) __builtin_neon_vmul_n_f64((float64x1_t)__p0, __p1);
  54668   return __ret;
  54669 }
  54670 #ifdef __LITTLE_ENDIAN__
  54671 __ai __attribute__((target("neon"))) float64x2_t vmulq_n_f64(float64x2_t __p0, float64_t __p1) {
  54672   float64x2_t __ret;
  54673   __ret = __p0 * (float64x2_t) {__p1, __p1};
  54674   return __ret;
  54675 }
  54676 #else
  54677 __ai __attribute__((target("neon"))) float64x2_t vmulq_n_f64(float64x2_t __p0, float64_t __p1) {
  54678   float64x2_t __ret;
  54679   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  54680   __ret = __rev0 * (float64x2_t) {__p1, __p1};
  54681   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54682   return __ret;
  54683 }
  54684 #endif
  54685 
  54686 #ifdef __LITTLE_ENDIAN__
  54687 __ai __attribute__((target("neon"))) poly16x8_t vmull_high_p8(poly8x16_t __p0, poly8x16_t __p1) {
  54688   poly16x8_t __ret;
  54689   __ret = vmull_p8(vget_high_p8(__p0), vget_high_p8(__p1));
  54690   return __ret;
  54691 }
  54692 #else
  54693 __ai __attribute__((target("neon"))) poly16x8_t vmull_high_p8(poly8x16_t __p0, poly8x16_t __p1) {
  54694   poly16x8_t __ret;
  54695   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54696   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54697   __ret = __noswap_vmull_p8(__noswap_vget_high_p8(__rev0), __noswap_vget_high_p8(__rev1));
  54698   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  54699   return __ret;
  54700 }
  54701 #endif
  54702 
  54703 #ifdef __LITTLE_ENDIAN__
  54704 __ai __attribute__((target("neon"))) uint16x8_t vmull_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  54705   uint16x8_t __ret;
  54706   __ret = vmull_u8(vget_high_u8(__p0), vget_high_u8(__p1));
  54707   return __ret;
  54708 }
  54709 #else
  54710 __ai __attribute__((target("neon"))) uint16x8_t vmull_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  54711   uint16x8_t __ret;
  54712   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54713   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54714   __ret = __noswap_vmull_u8(__noswap_vget_high_u8(__rev0), __noswap_vget_high_u8(__rev1));
  54715   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  54716   return __ret;
  54717 }
  54718 #endif
  54719 
  54720 #ifdef __LITTLE_ENDIAN__
  54721 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  54722   uint64x2_t __ret;
  54723   __ret = vmull_u32(vget_high_u32(__p0), vget_high_u32(__p1));
  54724   return __ret;
  54725 }
  54726 #else
  54727 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  54728   uint64x2_t __ret;
  54729   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  54730   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  54731   __ret = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0), __noswap_vget_high_u32(__rev1));
  54732   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54733   return __ret;
  54734 }
  54735 #endif
  54736 
  54737 #ifdef __LITTLE_ENDIAN__
  54738 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  54739   uint32x4_t __ret;
  54740   __ret = vmull_u16(vget_high_u16(__p0), vget_high_u16(__p1));
  54741   return __ret;
  54742 }
  54743 #else
  54744 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  54745   uint32x4_t __ret;
  54746   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  54747   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  54748   __ret = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0), __noswap_vget_high_u16(__rev1));
  54749   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  54750   return __ret;
  54751 }
  54752 #endif
  54753 
  54754 #ifdef __LITTLE_ENDIAN__
  54755 __ai __attribute__((target("neon"))) int16x8_t vmull_high_s8(int8x16_t __p0, int8x16_t __p1) {
  54756   int16x8_t __ret;
  54757   __ret = vmull_s8(vget_high_s8(__p0), vget_high_s8(__p1));
  54758   return __ret;
  54759 }
  54760 #else
  54761 __ai __attribute__((target("neon"))) int16x8_t vmull_high_s8(int8x16_t __p0, int8x16_t __p1) {
  54762   int16x8_t __ret;
  54763   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54764   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  54765   __ret = __noswap_vmull_s8(__noswap_vget_high_s8(__rev0), __noswap_vget_high_s8(__rev1));
  54766   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  54767   return __ret;
  54768 }
  54769 #endif
  54770 
  54771 #ifdef __LITTLE_ENDIAN__
  54772 __ai __attribute__((target("neon"))) int64x2_t vmull_high_s32(int32x4_t __p0, int32x4_t __p1) {
  54773   int64x2_t __ret;
  54774   __ret = vmull_s32(vget_high_s32(__p0), vget_high_s32(__p1));
  54775   return __ret;
  54776 }
  54777 #else
  54778 __ai __attribute__((target("neon"))) int64x2_t vmull_high_s32(int32x4_t __p0, int32x4_t __p1) {
  54779   int64x2_t __ret;
  54780   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  54781   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  54782   __ret = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1));
  54783   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54784   return __ret;
  54785 }
  54786 #endif
  54787 
  54788 #ifdef __LITTLE_ENDIAN__
  54789 __ai __attribute__((target("neon"))) int32x4_t vmull_high_s16(int16x8_t __p0, int16x8_t __p1) {
  54790   int32x4_t __ret;
  54791   __ret = vmull_s16(vget_high_s16(__p0), vget_high_s16(__p1));
  54792   return __ret;
  54793 }
  54794 #else
  54795 __ai __attribute__((target("neon"))) int32x4_t vmull_high_s16(int16x8_t __p0, int16x8_t __p1) {
  54796   int32x4_t __ret;
  54797   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  54798   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  54799   __ret = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1));
  54800   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  54801   return __ret;
  54802 }
  54803 #endif
  54804 
  54805 #ifdef __LITTLE_ENDIAN__
  54806 #define vmull_high_lane_u32(__p0_585, __p1_585, __p2_585) __extension__ ({ \
  54807   uint64x2_t __ret_585; \
  54808   uint32x4_t __s0_585 = __p0_585; \
  54809   uint32x2_t __s1_585 = __p1_585; \
  54810   __ret_585 = vmull_u32(vget_high_u32(__s0_585), splat_lane_u32(__s1_585, __p2_585)); \
  54811   __ret_585; \
  54812 })
  54813 #else
  54814 #define vmull_high_lane_u32(__p0_586, __p1_586, __p2_586) __extension__ ({ \
  54815   uint64x2_t __ret_586; \
  54816   uint32x4_t __s0_586 = __p0_586; \
  54817   uint32x2_t __s1_586 = __p1_586; \
  54818   uint32x4_t __rev0_586;  __rev0_586 = __builtin_shufflevector(__s0_586, __s0_586, 3, 2, 1, 0); \
  54819   uint32x2_t __rev1_586;  __rev1_586 = __builtin_shufflevector(__s1_586, __s1_586, 1, 0); \
  54820   __ret_586 = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0_586), __noswap_splat_lane_u32(__rev1_586, __p2_586)); \
  54821   __ret_586 = __builtin_shufflevector(__ret_586, __ret_586, 1, 0); \
  54822   __ret_586; \
  54823 })
  54824 #endif
  54825 
  54826 #ifdef __LITTLE_ENDIAN__
  54827 #define vmull_high_lane_u16(__p0_587, __p1_587, __p2_587) __extension__ ({ \
  54828   uint32x4_t __ret_587; \
  54829   uint16x8_t __s0_587 = __p0_587; \
  54830   uint16x4_t __s1_587 = __p1_587; \
  54831   __ret_587 = vmull_u16(vget_high_u16(__s0_587), splat_lane_u16(__s1_587, __p2_587)); \
  54832   __ret_587; \
  54833 })
  54834 #else
  54835 #define vmull_high_lane_u16(__p0_588, __p1_588, __p2_588) __extension__ ({ \
  54836   uint32x4_t __ret_588; \
  54837   uint16x8_t __s0_588 = __p0_588; \
  54838   uint16x4_t __s1_588 = __p1_588; \
  54839   uint16x8_t __rev0_588;  __rev0_588 = __builtin_shufflevector(__s0_588, __s0_588, 7, 6, 5, 4, 3, 2, 1, 0); \
  54840   uint16x4_t __rev1_588;  __rev1_588 = __builtin_shufflevector(__s1_588, __s1_588, 3, 2, 1, 0); \
  54841   __ret_588 = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0_588), __noswap_splat_lane_u16(__rev1_588, __p2_588)); \
  54842   __ret_588 = __builtin_shufflevector(__ret_588, __ret_588, 3, 2, 1, 0); \
  54843   __ret_588; \
  54844 })
  54845 #endif
  54846 
  54847 #ifdef __LITTLE_ENDIAN__
  54848 #define vmull_high_lane_s32(__p0_589, __p1_589, __p2_589) __extension__ ({ \
  54849   int64x2_t __ret_589; \
  54850   int32x4_t __s0_589 = __p0_589; \
  54851   int32x2_t __s1_589 = __p1_589; \
  54852   __ret_589 = vmull_s32(vget_high_s32(__s0_589), splat_lane_s32(__s1_589, __p2_589)); \
  54853   __ret_589; \
  54854 })
  54855 #else
  54856 #define vmull_high_lane_s32(__p0_590, __p1_590, __p2_590) __extension__ ({ \
  54857   int64x2_t __ret_590; \
  54858   int32x4_t __s0_590 = __p0_590; \
  54859   int32x2_t __s1_590 = __p1_590; \
  54860   int32x4_t __rev0_590;  __rev0_590 = __builtin_shufflevector(__s0_590, __s0_590, 3, 2, 1, 0); \
  54861   int32x2_t __rev1_590;  __rev1_590 = __builtin_shufflevector(__s1_590, __s1_590, 1, 0); \
  54862   __ret_590 = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0_590), __noswap_splat_lane_s32(__rev1_590, __p2_590)); \
  54863   __ret_590 = __builtin_shufflevector(__ret_590, __ret_590, 1, 0); \
  54864   __ret_590; \
  54865 })
  54866 #endif
  54867 
  54868 #ifdef __LITTLE_ENDIAN__
  54869 #define vmull_high_lane_s16(__p0_591, __p1_591, __p2_591) __extension__ ({ \
  54870   int32x4_t __ret_591; \
  54871   int16x8_t __s0_591 = __p0_591; \
  54872   int16x4_t __s1_591 = __p1_591; \
  54873   __ret_591 = vmull_s16(vget_high_s16(__s0_591), splat_lane_s16(__s1_591, __p2_591)); \
  54874   __ret_591; \
  54875 })
  54876 #else
  54877 #define vmull_high_lane_s16(__p0_592, __p1_592, __p2_592) __extension__ ({ \
  54878   int32x4_t __ret_592; \
  54879   int16x8_t __s0_592 = __p0_592; \
  54880   int16x4_t __s1_592 = __p1_592; \
  54881   int16x8_t __rev0_592;  __rev0_592 = __builtin_shufflevector(__s0_592, __s0_592, 7, 6, 5, 4, 3, 2, 1, 0); \
  54882   int16x4_t __rev1_592;  __rev1_592 = __builtin_shufflevector(__s1_592, __s1_592, 3, 2, 1, 0); \
  54883   __ret_592 = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0_592), __noswap_splat_lane_s16(__rev1_592, __p2_592)); \
  54884   __ret_592 = __builtin_shufflevector(__ret_592, __ret_592, 3, 2, 1, 0); \
  54885   __ret_592; \
  54886 })
  54887 #endif
  54888 
  54889 #ifdef __LITTLE_ENDIAN__
  54890 #define vmull_high_laneq_u32(__p0_593, __p1_593, __p2_593) __extension__ ({ \
  54891   uint64x2_t __ret_593; \
  54892   uint32x4_t __s0_593 = __p0_593; \
  54893   uint32x4_t __s1_593 = __p1_593; \
  54894   __ret_593 = vmull_u32(vget_high_u32(__s0_593), splat_laneq_u32(__s1_593, __p2_593)); \
  54895   __ret_593; \
  54896 })
  54897 #else
  54898 #define vmull_high_laneq_u32(__p0_594, __p1_594, __p2_594) __extension__ ({ \
  54899   uint64x2_t __ret_594; \
  54900   uint32x4_t __s0_594 = __p0_594; \
  54901   uint32x4_t __s1_594 = __p1_594; \
  54902   uint32x4_t __rev0_594;  __rev0_594 = __builtin_shufflevector(__s0_594, __s0_594, 3, 2, 1, 0); \
  54903   uint32x4_t __rev1_594;  __rev1_594 = __builtin_shufflevector(__s1_594, __s1_594, 3, 2, 1, 0); \
  54904   __ret_594 = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0_594), __noswap_splat_laneq_u32(__rev1_594, __p2_594)); \
  54905   __ret_594 = __builtin_shufflevector(__ret_594, __ret_594, 1, 0); \
  54906   __ret_594; \
  54907 })
  54908 #endif
  54909 
  54910 #ifdef __LITTLE_ENDIAN__
  54911 #define vmull_high_laneq_u16(__p0_595, __p1_595, __p2_595) __extension__ ({ \
  54912   uint32x4_t __ret_595; \
  54913   uint16x8_t __s0_595 = __p0_595; \
  54914   uint16x8_t __s1_595 = __p1_595; \
  54915   __ret_595 = vmull_u16(vget_high_u16(__s0_595), splat_laneq_u16(__s1_595, __p2_595)); \
  54916   __ret_595; \
  54917 })
  54918 #else
  54919 #define vmull_high_laneq_u16(__p0_596, __p1_596, __p2_596) __extension__ ({ \
  54920   uint32x4_t __ret_596; \
  54921   uint16x8_t __s0_596 = __p0_596; \
  54922   uint16x8_t __s1_596 = __p1_596; \
  54923   uint16x8_t __rev0_596;  __rev0_596 = __builtin_shufflevector(__s0_596, __s0_596, 7, 6, 5, 4, 3, 2, 1, 0); \
  54924   uint16x8_t __rev1_596;  __rev1_596 = __builtin_shufflevector(__s1_596, __s1_596, 7, 6, 5, 4, 3, 2, 1, 0); \
  54925   __ret_596 = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0_596), __noswap_splat_laneq_u16(__rev1_596, __p2_596)); \
  54926   __ret_596 = __builtin_shufflevector(__ret_596, __ret_596, 3, 2, 1, 0); \
  54927   __ret_596; \
  54928 })
  54929 #endif
  54930 
  54931 #ifdef __LITTLE_ENDIAN__
  54932 #define vmull_high_laneq_s32(__p0_597, __p1_597, __p2_597) __extension__ ({ \
  54933   int64x2_t __ret_597; \
  54934   int32x4_t __s0_597 = __p0_597; \
  54935   int32x4_t __s1_597 = __p1_597; \
  54936   __ret_597 = vmull_s32(vget_high_s32(__s0_597), splat_laneq_s32(__s1_597, __p2_597)); \
  54937   __ret_597; \
  54938 })
  54939 #else
  54940 #define vmull_high_laneq_s32(__p0_598, __p1_598, __p2_598) __extension__ ({ \
  54941   int64x2_t __ret_598; \
  54942   int32x4_t __s0_598 = __p0_598; \
  54943   int32x4_t __s1_598 = __p1_598; \
  54944   int32x4_t __rev0_598;  __rev0_598 = __builtin_shufflevector(__s0_598, __s0_598, 3, 2, 1, 0); \
  54945   int32x4_t __rev1_598;  __rev1_598 = __builtin_shufflevector(__s1_598, __s1_598, 3, 2, 1, 0); \
  54946   __ret_598 = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0_598), __noswap_splat_laneq_s32(__rev1_598, __p2_598)); \
  54947   __ret_598 = __builtin_shufflevector(__ret_598, __ret_598, 1, 0); \
  54948   __ret_598; \
  54949 })
  54950 #endif
  54951 
  54952 #ifdef __LITTLE_ENDIAN__
  54953 #define vmull_high_laneq_s16(__p0_599, __p1_599, __p2_599) __extension__ ({ \
  54954   int32x4_t __ret_599; \
  54955   int16x8_t __s0_599 = __p0_599; \
  54956   int16x8_t __s1_599 = __p1_599; \
  54957   __ret_599 = vmull_s16(vget_high_s16(__s0_599), splat_laneq_s16(__s1_599, __p2_599)); \
  54958   __ret_599; \
  54959 })
  54960 #else
  54961 #define vmull_high_laneq_s16(__p0_600, __p1_600, __p2_600) __extension__ ({ \
  54962   int32x4_t __ret_600; \
  54963   int16x8_t __s0_600 = __p0_600; \
  54964   int16x8_t __s1_600 = __p1_600; \
  54965   int16x8_t __rev0_600;  __rev0_600 = __builtin_shufflevector(__s0_600, __s0_600, 7, 6, 5, 4, 3, 2, 1, 0); \
  54966   int16x8_t __rev1_600;  __rev1_600 = __builtin_shufflevector(__s1_600, __s1_600, 7, 6, 5, 4, 3, 2, 1, 0); \
  54967   __ret_600 = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0_600), __noswap_splat_laneq_s16(__rev1_600, __p2_600)); \
  54968   __ret_600 = __builtin_shufflevector(__ret_600, __ret_600, 3, 2, 1, 0); \
  54969   __ret_600; \
  54970 })
  54971 #endif
  54972 
  54973 #ifdef __LITTLE_ENDIAN__
  54974 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_n_u32(uint32x4_t __p0, uint32_t __p1) {
  54975   uint64x2_t __ret;
  54976   __ret = vmull_n_u32(vget_high_u32(__p0), __p1);
  54977   return __ret;
  54978 }
  54979 #else
  54980 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_n_u32(uint32x4_t __p0, uint32_t __p1) {
  54981   uint64x2_t __ret;
  54982   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  54983   __ret = __noswap_vmull_n_u32(__noswap_vget_high_u32(__rev0), __p1);
  54984   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  54985   return __ret;
  54986 }
  54987 #endif
  54988 
  54989 #ifdef __LITTLE_ENDIAN__
  54990 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_n_u16(uint16x8_t __p0, uint16_t __p1) {
  54991   uint32x4_t __ret;
  54992   __ret = vmull_n_u16(vget_high_u16(__p0), __p1);
  54993   return __ret;
  54994 }
  54995 #else
  54996 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_n_u16(uint16x8_t __p0, uint16_t __p1) {
  54997   uint32x4_t __ret;
  54998   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  54999   __ret = __noswap_vmull_n_u16(__noswap_vget_high_u16(__rev0), __p1);
  55000   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55001   return __ret;
  55002 }
  55003 #endif
  55004 
  55005 #ifdef __LITTLE_ENDIAN__
  55006 __ai __attribute__((target("neon"))) int64x2_t vmull_high_n_s32(int32x4_t __p0, int32_t __p1) {
  55007   int64x2_t __ret;
  55008   __ret = vmull_n_s32(vget_high_s32(__p0), __p1);
  55009   return __ret;
  55010 }
  55011 #else
  55012 __ai __attribute__((target("neon"))) int64x2_t vmull_high_n_s32(int32x4_t __p0, int32_t __p1) {
  55013   int64x2_t __ret;
  55014   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55015   __ret = __noswap_vmull_n_s32(__noswap_vget_high_s32(__rev0), __p1);
  55016   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55017   return __ret;
  55018 }
  55019 #endif
  55020 
  55021 #ifdef __LITTLE_ENDIAN__
  55022 __ai __attribute__((target("neon"))) int32x4_t vmull_high_n_s16(int16x8_t __p0, int16_t __p1) {
  55023   int32x4_t __ret;
  55024   __ret = vmull_n_s16(vget_high_s16(__p0), __p1);
  55025   return __ret;
  55026 }
  55027 #else
  55028 __ai __attribute__((target("neon"))) int32x4_t vmull_high_n_s16(int16x8_t __p0, int16_t __p1) {
  55029   int32x4_t __ret;
  55030   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55031   __ret = __noswap_vmull_n_s16(__noswap_vget_high_s16(__rev0), __p1);
  55032   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55033   return __ret;
  55034 }
  55035 #endif
  55036 
  55037 #ifdef __LITTLE_ENDIAN__
  55038 #define vmull_laneq_u32(__p0_601, __p1_601, __p2_601) __extension__ ({ \
  55039   uint64x2_t __ret_601; \
  55040   uint32x2_t __s0_601 = __p0_601; \
  55041   uint32x4_t __s1_601 = __p1_601; \
  55042   __ret_601 = vmull_u32(__s0_601, splat_laneq_u32(__s1_601, __p2_601)); \
  55043   __ret_601; \
  55044 })
  55045 #else
  55046 #define vmull_laneq_u32(__p0_602, __p1_602, __p2_602) __extension__ ({ \
  55047   uint64x2_t __ret_602; \
  55048   uint32x2_t __s0_602 = __p0_602; \
  55049   uint32x4_t __s1_602 = __p1_602; \
  55050   uint32x2_t __rev0_602;  __rev0_602 = __builtin_shufflevector(__s0_602, __s0_602, 1, 0); \
  55051   uint32x4_t __rev1_602;  __rev1_602 = __builtin_shufflevector(__s1_602, __s1_602, 3, 2, 1, 0); \
  55052   __ret_602 = __noswap_vmull_u32(__rev0_602, __noswap_splat_laneq_u32(__rev1_602, __p2_602)); \
  55053   __ret_602 = __builtin_shufflevector(__ret_602, __ret_602, 1, 0); \
  55054   __ret_602; \
  55055 })
  55056 #endif
  55057 
  55058 #ifdef __LITTLE_ENDIAN__
  55059 #define vmull_laneq_u16(__p0_603, __p1_603, __p2_603) __extension__ ({ \
  55060   uint32x4_t __ret_603; \
  55061   uint16x4_t __s0_603 = __p0_603; \
  55062   uint16x8_t __s1_603 = __p1_603; \
  55063   __ret_603 = vmull_u16(__s0_603, splat_laneq_u16(__s1_603, __p2_603)); \
  55064   __ret_603; \
  55065 })
  55066 #else
  55067 #define vmull_laneq_u16(__p0_604, __p1_604, __p2_604) __extension__ ({ \
  55068   uint32x4_t __ret_604; \
  55069   uint16x4_t __s0_604 = __p0_604; \
  55070   uint16x8_t __s1_604 = __p1_604; \
  55071   uint16x4_t __rev0_604;  __rev0_604 = __builtin_shufflevector(__s0_604, __s0_604, 3, 2, 1, 0); \
  55072   uint16x8_t __rev1_604;  __rev1_604 = __builtin_shufflevector(__s1_604, __s1_604, 7, 6, 5, 4, 3, 2, 1, 0); \
  55073   __ret_604 = __noswap_vmull_u16(__rev0_604, __noswap_splat_laneq_u16(__rev1_604, __p2_604)); \
  55074   __ret_604 = __builtin_shufflevector(__ret_604, __ret_604, 3, 2, 1, 0); \
  55075   __ret_604; \
  55076 })
  55077 #endif
  55078 
  55079 #ifdef __LITTLE_ENDIAN__
  55080 #define vmull_laneq_s32(__p0_605, __p1_605, __p2_605) __extension__ ({ \
  55081   int64x2_t __ret_605; \
  55082   int32x2_t __s0_605 = __p0_605; \
  55083   int32x4_t __s1_605 = __p1_605; \
  55084   __ret_605 = vmull_s32(__s0_605, splat_laneq_s32(__s1_605, __p2_605)); \
  55085   __ret_605; \
  55086 })
  55087 #else
  55088 #define vmull_laneq_s32(__p0_606, __p1_606, __p2_606) __extension__ ({ \
  55089   int64x2_t __ret_606; \
  55090   int32x2_t __s0_606 = __p0_606; \
  55091   int32x4_t __s1_606 = __p1_606; \
  55092   int32x2_t __rev0_606;  __rev0_606 = __builtin_shufflevector(__s0_606, __s0_606, 1, 0); \
  55093   int32x4_t __rev1_606;  __rev1_606 = __builtin_shufflevector(__s1_606, __s1_606, 3, 2, 1, 0); \
  55094   __ret_606 = __noswap_vmull_s32(__rev0_606, __noswap_splat_laneq_s32(__rev1_606, __p2_606)); \
  55095   __ret_606 = __builtin_shufflevector(__ret_606, __ret_606, 1, 0); \
  55096   __ret_606; \
  55097 })
  55098 #endif
  55099 
  55100 #ifdef __LITTLE_ENDIAN__
  55101 #define vmull_laneq_s16(__p0_607, __p1_607, __p2_607) __extension__ ({ \
  55102   int32x4_t __ret_607; \
  55103   int16x4_t __s0_607 = __p0_607; \
  55104   int16x8_t __s1_607 = __p1_607; \
  55105   __ret_607 = vmull_s16(__s0_607, splat_laneq_s16(__s1_607, __p2_607)); \
  55106   __ret_607; \
  55107 })
  55108 #else
  55109 #define vmull_laneq_s16(__p0_608, __p1_608, __p2_608) __extension__ ({ \
  55110   int32x4_t __ret_608; \
  55111   int16x4_t __s0_608 = __p0_608; \
  55112   int16x8_t __s1_608 = __p1_608; \
  55113   int16x4_t __rev0_608;  __rev0_608 = __builtin_shufflevector(__s0_608, __s0_608, 3, 2, 1, 0); \
  55114   int16x8_t __rev1_608;  __rev1_608 = __builtin_shufflevector(__s1_608, __s1_608, 7, 6, 5, 4, 3, 2, 1, 0); \
  55115   __ret_608 = __noswap_vmull_s16(__rev0_608, __noswap_splat_laneq_s16(__rev1_608, __p2_608)); \
  55116   __ret_608 = __builtin_shufflevector(__ret_608, __ret_608, 3, 2, 1, 0); \
  55117   __ret_608; \
  55118 })
  55119 #endif
  55120 
  55121 #ifdef __LITTLE_ENDIAN__
  55122 __ai __attribute__((target("neon"))) float64x2_t vmulxq_f64(float64x2_t __p0, float64x2_t __p1) {
  55123   float64x2_t __ret;
  55124   __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55125   return __ret;
  55126 }
  55127 #else
  55128 __ai __attribute__((target("neon"))) float64x2_t vmulxq_f64(float64x2_t __p0, float64x2_t __p1) {
  55129   float64x2_t __ret;
  55130   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55131   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55132   __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  55133   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55134   return __ret;
  55135 }
  55136 __ai __attribute__((target("neon"))) float64x2_t __noswap_vmulxq_f64(float64x2_t __p0, float64x2_t __p1) {
  55137   float64x2_t __ret;
  55138   __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55139   return __ret;
  55140 }
  55141 #endif
  55142 
  55143 #ifdef __LITTLE_ENDIAN__
  55144 __ai __attribute__((target("neon"))) float32x4_t vmulxq_f32(float32x4_t __p0, float32x4_t __p1) {
  55145   float32x4_t __ret;
  55146   __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  55147   return __ret;
  55148 }
  55149 #else
  55150 __ai __attribute__((target("neon"))) float32x4_t vmulxq_f32(float32x4_t __p0, float32x4_t __p1) {
  55151   float32x4_t __ret;
  55152   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55153   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55154   __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  55155   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55156   return __ret;
  55157 }
  55158 __ai __attribute__((target("neon"))) float32x4_t __noswap_vmulxq_f32(float32x4_t __p0, float32x4_t __p1) {
  55159   float32x4_t __ret;
  55160   __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  55161   return __ret;
  55162 }
  55163 #endif
  55164 
  55165 __ai __attribute__((target("neon"))) float64x1_t vmulx_f64(float64x1_t __p0, float64x1_t __p1) {
  55166   float64x1_t __ret;
  55167   __ret = (float64x1_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  55168   return __ret;
  55169 }
  55170 #ifdef __LITTLE_ENDIAN__
  55171 __ai __attribute__((target("neon"))) float32x2_t vmulx_f32(float32x2_t __p0, float32x2_t __p1) {
  55172   float32x2_t __ret;
  55173   __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  55174   return __ret;
  55175 }
  55176 #else
  55177 __ai __attribute__((target("neon"))) float32x2_t vmulx_f32(float32x2_t __p0, float32x2_t __p1) {
  55178   float32x2_t __ret;
  55179   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55180   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55181   __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  55182   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55183   return __ret;
  55184 }
  55185 __ai __attribute__((target("neon"))) float32x2_t __noswap_vmulx_f32(float32x2_t __p0, float32x2_t __p1) {
  55186   float32x2_t __ret;
  55187   __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  55188   return __ret;
  55189 }
  55190 #endif
  55191 
  55192 __ai __attribute__((target("neon"))) float64_t vmulxd_f64(float64_t __p0, float64_t __p1) {
  55193   float64_t __ret;
  55194   __ret = (float64_t) __builtin_neon_vmulxd_f64(__p0, __p1);
  55195   return __ret;
  55196 }
  55197 __ai __attribute__((target("neon"))) float32_t vmulxs_f32(float32_t __p0, float32_t __p1) {
  55198   float32_t __ret;
  55199   __ret = (float32_t) __builtin_neon_vmulxs_f32(__p0, __p1);
  55200   return __ret;
  55201 }
  55202 #define vmulxd_lane_f64(__p0_609, __p1_609, __p2_609) __extension__ ({ \
  55203   float64_t __ret_609; \
  55204   float64_t __s0_609 = __p0_609; \
  55205   float64x1_t __s1_609 = __p1_609; \
  55206   __ret_609 = vmulxd_f64(__s0_609, vget_lane_f64(__s1_609, __p2_609)); \
  55207   __ret_609; \
  55208 })
  55209 #ifdef __LITTLE_ENDIAN__
  55210 #define vmulxs_lane_f32(__p0_610, __p1_610, __p2_610) __extension__ ({ \
  55211   float32_t __ret_610; \
  55212   float32_t __s0_610 = __p0_610; \
  55213   float32x2_t __s1_610 = __p1_610; \
  55214   __ret_610 = vmulxs_f32(__s0_610, vget_lane_f32(__s1_610, __p2_610)); \
  55215   __ret_610; \
  55216 })
  55217 #else
  55218 #define vmulxs_lane_f32(__p0_611, __p1_611, __p2_611) __extension__ ({ \
  55219   float32_t __ret_611; \
  55220   float32_t __s0_611 = __p0_611; \
  55221   float32x2_t __s1_611 = __p1_611; \
  55222   float32x2_t __rev1_611;  __rev1_611 = __builtin_shufflevector(__s1_611, __s1_611, 1, 0); \
  55223   __ret_611 = vmulxs_f32(__s0_611, __noswap_vget_lane_f32(__rev1_611, __p2_611)); \
  55224   __ret_611; \
  55225 })
  55226 #endif
  55227 
  55228 #ifdef __LITTLE_ENDIAN__
  55229 #define vmulxq_lane_f64(__p0_612, __p1_612, __p2_612) __extension__ ({ \
  55230   float64x2_t __ret_612; \
  55231   float64x2_t __s0_612 = __p0_612; \
  55232   float64x1_t __s1_612 = __p1_612; \
  55233   __ret_612 = vmulxq_f64(__s0_612, splatq_lane_f64(__s1_612, __p2_612)); \
  55234   __ret_612; \
  55235 })
  55236 #else
  55237 #define vmulxq_lane_f64(__p0_613, __p1_613, __p2_613) __extension__ ({ \
  55238   float64x2_t __ret_613; \
  55239   float64x2_t __s0_613 = __p0_613; \
  55240   float64x1_t __s1_613 = __p1_613; \
  55241   float64x2_t __rev0_613;  __rev0_613 = __builtin_shufflevector(__s0_613, __s0_613, 1, 0); \
  55242   __ret_613 = __noswap_vmulxq_f64(__rev0_613, __noswap_splatq_lane_f64(__s1_613, __p2_613)); \
  55243   __ret_613 = __builtin_shufflevector(__ret_613, __ret_613, 1, 0); \
  55244   __ret_613; \
  55245 })
  55246 #endif
  55247 
  55248 #ifdef __LITTLE_ENDIAN__
  55249 #define vmulxq_lane_f32(__p0_614, __p1_614, __p2_614) __extension__ ({ \
  55250   float32x4_t __ret_614; \
  55251   float32x4_t __s0_614 = __p0_614; \
  55252   float32x2_t __s1_614 = __p1_614; \
  55253   __ret_614 = vmulxq_f32(__s0_614, splatq_lane_f32(__s1_614, __p2_614)); \
  55254   __ret_614; \
  55255 })
  55256 #else
  55257 #define vmulxq_lane_f32(__p0_615, __p1_615, __p2_615) __extension__ ({ \
  55258   float32x4_t __ret_615; \
  55259   float32x4_t __s0_615 = __p0_615; \
  55260   float32x2_t __s1_615 = __p1_615; \
  55261   float32x4_t __rev0_615;  __rev0_615 = __builtin_shufflevector(__s0_615, __s0_615, 3, 2, 1, 0); \
  55262   float32x2_t __rev1_615;  __rev1_615 = __builtin_shufflevector(__s1_615, __s1_615, 1, 0); \
  55263   __ret_615 = __noswap_vmulxq_f32(__rev0_615, __noswap_splatq_lane_f32(__rev1_615, __p2_615)); \
  55264   __ret_615 = __builtin_shufflevector(__ret_615, __ret_615, 3, 2, 1, 0); \
  55265   __ret_615; \
  55266 })
  55267 #endif
  55268 
  55269 #ifdef __LITTLE_ENDIAN__
  55270 #define vmulx_lane_f32(__p0_616, __p1_616, __p2_616) __extension__ ({ \
  55271   float32x2_t __ret_616; \
  55272   float32x2_t __s0_616 = __p0_616; \
  55273   float32x2_t __s1_616 = __p1_616; \
  55274   __ret_616 = vmulx_f32(__s0_616, splat_lane_f32(__s1_616, __p2_616)); \
  55275   __ret_616; \
  55276 })
  55277 #else
  55278 #define vmulx_lane_f32(__p0_617, __p1_617, __p2_617) __extension__ ({ \
  55279   float32x2_t __ret_617; \
  55280   float32x2_t __s0_617 = __p0_617; \
  55281   float32x2_t __s1_617 = __p1_617; \
  55282   float32x2_t __rev0_617;  __rev0_617 = __builtin_shufflevector(__s0_617, __s0_617, 1, 0); \
  55283   float32x2_t __rev1_617;  __rev1_617 = __builtin_shufflevector(__s1_617, __s1_617, 1, 0); \
  55284   __ret_617 = __noswap_vmulx_f32(__rev0_617, __noswap_splat_lane_f32(__rev1_617, __p2_617)); \
  55285   __ret_617 = __builtin_shufflevector(__ret_617, __ret_617, 1, 0); \
  55286   __ret_617; \
  55287 })
  55288 #endif
  55289 
  55290 #ifdef __LITTLE_ENDIAN__
  55291 #define vmulxd_laneq_f64(__p0_618, __p1_618, __p2_618) __extension__ ({ \
  55292   float64_t __ret_618; \
  55293   float64_t __s0_618 = __p0_618; \
  55294   float64x2_t __s1_618 = __p1_618; \
  55295   __ret_618 = vmulxd_f64(__s0_618, vgetq_lane_f64(__s1_618, __p2_618)); \
  55296   __ret_618; \
  55297 })
  55298 #else
  55299 #define vmulxd_laneq_f64(__p0_619, __p1_619, __p2_619) __extension__ ({ \
  55300   float64_t __ret_619; \
  55301   float64_t __s0_619 = __p0_619; \
  55302   float64x2_t __s1_619 = __p1_619; \
  55303   float64x2_t __rev1_619;  __rev1_619 = __builtin_shufflevector(__s1_619, __s1_619, 1, 0); \
  55304   __ret_619 = vmulxd_f64(__s0_619, __noswap_vgetq_lane_f64(__rev1_619, __p2_619)); \
  55305   __ret_619; \
  55306 })
  55307 #endif
  55308 
  55309 #ifdef __LITTLE_ENDIAN__
  55310 #define vmulxs_laneq_f32(__p0_620, __p1_620, __p2_620) __extension__ ({ \
  55311   float32_t __ret_620; \
  55312   float32_t __s0_620 = __p0_620; \
  55313   float32x4_t __s1_620 = __p1_620; \
  55314   __ret_620 = vmulxs_f32(__s0_620, vgetq_lane_f32(__s1_620, __p2_620)); \
  55315   __ret_620; \
  55316 })
  55317 #else
  55318 #define vmulxs_laneq_f32(__p0_621, __p1_621, __p2_621) __extension__ ({ \
  55319   float32_t __ret_621; \
  55320   float32_t __s0_621 = __p0_621; \
  55321   float32x4_t __s1_621 = __p1_621; \
  55322   float32x4_t __rev1_621;  __rev1_621 = __builtin_shufflevector(__s1_621, __s1_621, 3, 2, 1, 0); \
  55323   __ret_621 = vmulxs_f32(__s0_621, __noswap_vgetq_lane_f32(__rev1_621, __p2_621)); \
  55324   __ret_621; \
  55325 })
  55326 #endif
  55327 
  55328 #ifdef __LITTLE_ENDIAN__
  55329 #define vmulxq_laneq_f64(__p0_622, __p1_622, __p2_622) __extension__ ({ \
  55330   float64x2_t __ret_622; \
  55331   float64x2_t __s0_622 = __p0_622; \
  55332   float64x2_t __s1_622 = __p1_622; \
  55333   __ret_622 = vmulxq_f64(__s0_622, splatq_laneq_f64(__s1_622, __p2_622)); \
  55334   __ret_622; \
  55335 })
  55336 #else
  55337 #define vmulxq_laneq_f64(__p0_623, __p1_623, __p2_623) __extension__ ({ \
  55338   float64x2_t __ret_623; \
  55339   float64x2_t __s0_623 = __p0_623; \
  55340   float64x2_t __s1_623 = __p1_623; \
  55341   float64x2_t __rev0_623;  __rev0_623 = __builtin_shufflevector(__s0_623, __s0_623, 1, 0); \
  55342   float64x2_t __rev1_623;  __rev1_623 = __builtin_shufflevector(__s1_623, __s1_623, 1, 0); \
  55343   __ret_623 = __noswap_vmulxq_f64(__rev0_623, __noswap_splatq_laneq_f64(__rev1_623, __p2_623)); \
  55344   __ret_623 = __builtin_shufflevector(__ret_623, __ret_623, 1, 0); \
  55345   __ret_623; \
  55346 })
  55347 #endif
  55348 
  55349 #ifdef __LITTLE_ENDIAN__
  55350 #define vmulxq_laneq_f32(__p0_624, __p1_624, __p2_624) __extension__ ({ \
  55351   float32x4_t __ret_624; \
  55352   float32x4_t __s0_624 = __p0_624; \
  55353   float32x4_t __s1_624 = __p1_624; \
  55354   __ret_624 = vmulxq_f32(__s0_624, splatq_laneq_f32(__s1_624, __p2_624)); \
  55355   __ret_624; \
  55356 })
  55357 #else
  55358 #define vmulxq_laneq_f32(__p0_625, __p1_625, __p2_625) __extension__ ({ \
  55359   float32x4_t __ret_625; \
  55360   float32x4_t __s0_625 = __p0_625; \
  55361   float32x4_t __s1_625 = __p1_625; \
  55362   float32x4_t __rev0_625;  __rev0_625 = __builtin_shufflevector(__s0_625, __s0_625, 3, 2, 1, 0); \
  55363   float32x4_t __rev1_625;  __rev1_625 = __builtin_shufflevector(__s1_625, __s1_625, 3, 2, 1, 0); \
  55364   __ret_625 = __noswap_vmulxq_f32(__rev0_625, __noswap_splatq_laneq_f32(__rev1_625, __p2_625)); \
  55365   __ret_625 = __builtin_shufflevector(__ret_625, __ret_625, 3, 2, 1, 0); \
  55366   __ret_625; \
  55367 })
  55368 #endif
  55369 
  55370 #ifdef __LITTLE_ENDIAN__
  55371 #define vmulx_laneq_f32(__p0_626, __p1_626, __p2_626) __extension__ ({ \
  55372   float32x2_t __ret_626; \
  55373   float32x2_t __s0_626 = __p0_626; \
  55374   float32x4_t __s1_626 = __p1_626; \
  55375   __ret_626 = vmulx_f32(__s0_626, splat_laneq_f32(__s1_626, __p2_626)); \
  55376   __ret_626; \
  55377 })
  55378 #else
  55379 #define vmulx_laneq_f32(__p0_627, __p1_627, __p2_627) __extension__ ({ \
  55380   float32x2_t __ret_627; \
  55381   float32x2_t __s0_627 = __p0_627; \
  55382   float32x4_t __s1_627 = __p1_627; \
  55383   float32x2_t __rev0_627;  __rev0_627 = __builtin_shufflevector(__s0_627, __s0_627, 1, 0); \
  55384   float32x4_t __rev1_627;  __rev1_627 = __builtin_shufflevector(__s1_627, __s1_627, 3, 2, 1, 0); \
  55385   __ret_627 = __noswap_vmulx_f32(__rev0_627, __noswap_splat_laneq_f32(__rev1_627, __p2_627)); \
  55386   __ret_627 = __builtin_shufflevector(__ret_627, __ret_627, 1, 0); \
  55387   __ret_627; \
  55388 })
  55389 #endif
  55390 
  55391 #ifdef __LITTLE_ENDIAN__
  55392 __ai __attribute__((target("neon"))) float64x2_t vnegq_f64(float64x2_t __p0) {
  55393   float64x2_t __ret;
  55394   __ret = -__p0;
  55395   return __ret;
  55396 }
  55397 #else
  55398 __ai __attribute__((target("neon"))) float64x2_t vnegq_f64(float64x2_t __p0) {
  55399   float64x2_t __ret;
  55400   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55401   __ret = -__rev0;
  55402   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55403   return __ret;
  55404 }
  55405 #endif
  55406 
  55407 #ifdef __LITTLE_ENDIAN__
  55408 __ai __attribute__((target("neon"))) int64x2_t vnegq_s64(int64x2_t __p0) {
  55409   int64x2_t __ret;
  55410   __ret = -__p0;
  55411   return __ret;
  55412 }
  55413 #else
  55414 __ai __attribute__((target("neon"))) int64x2_t vnegq_s64(int64x2_t __p0) {
  55415   int64x2_t __ret;
  55416   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55417   __ret = -__rev0;
  55418   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55419   return __ret;
  55420 }
  55421 #endif
  55422 
  55423 __ai __attribute__((target("neon"))) float64x1_t vneg_f64(float64x1_t __p0) {
  55424   float64x1_t __ret;
  55425   __ret = -__p0;
  55426   return __ret;
  55427 }
  55428 __ai __attribute__((target("neon"))) int64x1_t vneg_s64(int64x1_t __p0) {
  55429   int64x1_t __ret;
  55430   __ret = -__p0;
  55431   return __ret;
  55432 }
  55433 __ai __attribute__((target("neon"))) int64_t vnegd_s64(int64_t __p0) {
  55434   int64_t __ret;
  55435   __ret = (int64_t) __builtin_neon_vnegd_s64(__p0);
  55436   return __ret;
  55437 }
  55438 #ifdef __LITTLE_ENDIAN__
  55439 __ai __attribute__((target("neon"))) uint8x16_t vpaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55440   uint8x16_t __ret;
  55441   __ret = (uint8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  55442   return __ret;
  55443 }
  55444 #else
  55445 __ai __attribute__((target("neon"))) uint8x16_t vpaddq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55446   uint8x16_t __ret;
  55447   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55448   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55449   __ret = (uint8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  55450   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55451   return __ret;
  55452 }
  55453 #endif
  55454 
  55455 #ifdef __LITTLE_ENDIAN__
  55456 __ai __attribute__((target("neon"))) uint32x4_t vpaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55457   uint32x4_t __ret;
  55458   __ret = (uint32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  55459   return __ret;
  55460 }
  55461 #else
  55462 __ai __attribute__((target("neon"))) uint32x4_t vpaddq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55463   uint32x4_t __ret;
  55464   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55465   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55466   __ret = (uint32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  55467   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55468   return __ret;
  55469 }
  55470 #endif
  55471 
  55472 #ifdef __LITTLE_ENDIAN__
  55473 __ai __attribute__((target("neon"))) uint64x2_t vpaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  55474   uint64x2_t __ret;
  55475   __ret = (uint64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  55476   return __ret;
  55477 }
  55478 #else
  55479 __ai __attribute__((target("neon"))) uint64x2_t vpaddq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  55480   uint64x2_t __ret;
  55481   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55482   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55483   __ret = (uint64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  55484   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55485   return __ret;
  55486 }
  55487 #endif
  55488 
  55489 #ifdef __LITTLE_ENDIAN__
  55490 __ai __attribute__((target("neon"))) uint16x8_t vpaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55491   uint16x8_t __ret;
  55492   __ret = (uint16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  55493   return __ret;
  55494 }
  55495 #else
  55496 __ai __attribute__((target("neon"))) uint16x8_t vpaddq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55497   uint16x8_t __ret;
  55498   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55499   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  55500   __ret = (uint16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  55501   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  55502   return __ret;
  55503 }
  55504 #endif
  55505 
  55506 #ifdef __LITTLE_ENDIAN__
  55507 __ai __attribute__((target("neon"))) int8x16_t vpaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  55508   int8x16_t __ret;
  55509   __ret = (int8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  55510   return __ret;
  55511 }
  55512 #else
  55513 __ai __attribute__((target("neon"))) int8x16_t vpaddq_s8(int8x16_t __p0, int8x16_t __p1) {
  55514   int8x16_t __ret;
  55515   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55516   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55517   __ret = (int8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  55518   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55519   return __ret;
  55520 }
  55521 #endif
  55522 
  55523 #ifdef __LITTLE_ENDIAN__
  55524 __ai __attribute__((target("neon"))) float64x2_t vpaddq_f64(float64x2_t __p0, float64x2_t __p1) {
  55525   float64x2_t __ret;
  55526   __ret = (float64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55527   return __ret;
  55528 }
  55529 #else
  55530 __ai __attribute__((target("neon"))) float64x2_t vpaddq_f64(float64x2_t __p0, float64x2_t __p1) {
  55531   float64x2_t __ret;
  55532   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55533   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55534   __ret = (float64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  55535   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55536   return __ret;
  55537 }
  55538 #endif
  55539 
  55540 #ifdef __LITTLE_ENDIAN__
  55541 __ai __attribute__((target("neon"))) float32x4_t vpaddq_f32(float32x4_t __p0, float32x4_t __p1) {
  55542   float32x4_t __ret;
  55543   __ret = (float32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  55544   return __ret;
  55545 }
  55546 #else
  55547 __ai __attribute__((target("neon"))) float32x4_t vpaddq_f32(float32x4_t __p0, float32x4_t __p1) {
  55548   float32x4_t __ret;
  55549   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55550   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55551   __ret = (float32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  55552   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55553   return __ret;
  55554 }
  55555 #endif
  55556 
  55557 #ifdef __LITTLE_ENDIAN__
  55558 __ai __attribute__((target("neon"))) int32x4_t vpaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  55559   int32x4_t __ret;
  55560   __ret = (int32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  55561   return __ret;
  55562 }
  55563 #else
  55564 __ai __attribute__((target("neon"))) int32x4_t vpaddq_s32(int32x4_t __p0, int32x4_t __p1) {
  55565   int32x4_t __ret;
  55566   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55567   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55568   __ret = (int32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  55569   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55570   return __ret;
  55571 }
  55572 #endif
  55573 
  55574 #ifdef __LITTLE_ENDIAN__
  55575 __ai __attribute__((target("neon"))) int64x2_t vpaddq_s64(int64x2_t __p0, int64x2_t __p1) {
  55576   int64x2_t __ret;
  55577   __ret = (int64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  55578   return __ret;
  55579 }
  55580 #else
  55581 __ai __attribute__((target("neon"))) int64x2_t vpaddq_s64(int64x2_t __p0, int64x2_t __p1) {
  55582   int64x2_t __ret;
  55583   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55584   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55585   __ret = (int64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  55586   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55587   return __ret;
  55588 }
  55589 #endif
  55590 
  55591 #ifdef __LITTLE_ENDIAN__
  55592 __ai __attribute__((target("neon"))) int16x8_t vpaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  55593   int16x8_t __ret;
  55594   __ret = (int16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  55595   return __ret;
  55596 }
  55597 #else
  55598 __ai __attribute__((target("neon"))) int16x8_t vpaddq_s16(int16x8_t __p0, int16x8_t __p1) {
  55599   int16x8_t __ret;
  55600   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55601   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  55602   __ret = (int16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  55603   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  55604   return __ret;
  55605 }
  55606 #endif
  55607 
  55608 #ifdef __LITTLE_ENDIAN__
  55609 __ai __attribute__((target("neon"))) uint64_t vpaddd_u64(uint64x2_t __p0) {
  55610   uint64_t __ret;
  55611   __ret = (uint64_t) __builtin_neon_vpaddd_u64(__p0);
  55612   return __ret;
  55613 }
  55614 #else
  55615 __ai __attribute__((target("neon"))) uint64_t vpaddd_u64(uint64x2_t __p0) {
  55616   uint64_t __ret;
  55617   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55618   __ret = (uint64_t) __builtin_neon_vpaddd_u64(__rev0);
  55619   return __ret;
  55620 }
  55621 #endif
  55622 
  55623 #ifdef __LITTLE_ENDIAN__
  55624 __ai __attribute__((target("neon"))) float64_t vpaddd_f64(float64x2_t __p0) {
  55625   float64_t __ret;
  55626   __ret = (float64_t) __builtin_neon_vpaddd_f64(__p0);
  55627   return __ret;
  55628 }
  55629 #else
  55630 __ai __attribute__((target("neon"))) float64_t vpaddd_f64(float64x2_t __p0) {
  55631   float64_t __ret;
  55632   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55633   __ret = (float64_t) __builtin_neon_vpaddd_f64(__rev0);
  55634   return __ret;
  55635 }
  55636 #endif
  55637 
  55638 #ifdef __LITTLE_ENDIAN__
  55639 __ai __attribute__((target("neon"))) int64_t vpaddd_s64(int64x2_t __p0) {
  55640   int64_t __ret;
  55641   __ret = (int64_t) __builtin_neon_vpaddd_s64(__p0);
  55642   return __ret;
  55643 }
  55644 #else
  55645 __ai __attribute__((target("neon"))) int64_t vpaddd_s64(int64x2_t __p0) {
  55646   int64_t __ret;
  55647   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55648   __ret = (int64_t) __builtin_neon_vpaddd_s64(__rev0);
  55649   return __ret;
  55650 }
  55651 #endif
  55652 
  55653 #ifdef __LITTLE_ENDIAN__
  55654 __ai __attribute__((target("neon"))) float32_t vpadds_f32(float32x2_t __p0) {
  55655   float32_t __ret;
  55656   __ret = (float32_t) __builtin_neon_vpadds_f32(__p0);
  55657   return __ret;
  55658 }
  55659 #else
  55660 __ai __attribute__((target("neon"))) float32_t vpadds_f32(float32x2_t __p0) {
  55661   float32_t __ret;
  55662   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55663   __ret = (float32_t) __builtin_neon_vpadds_f32(__rev0);
  55664   return __ret;
  55665 }
  55666 #endif
  55667 
  55668 #ifdef __LITTLE_ENDIAN__
  55669 __ai __attribute__((target("neon"))) uint8x16_t vpmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55670   uint8x16_t __ret;
  55671   __ret = (uint8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  55672   return __ret;
  55673 }
  55674 #else
  55675 __ai __attribute__((target("neon"))) uint8x16_t vpmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55676   uint8x16_t __ret;
  55677   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55678   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55679   __ret = (uint8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  55680   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55681   return __ret;
  55682 }
  55683 #endif
  55684 
  55685 #ifdef __LITTLE_ENDIAN__
  55686 __ai __attribute__((target("neon"))) uint32x4_t vpmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55687   uint32x4_t __ret;
  55688   __ret = (uint32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  55689   return __ret;
  55690 }
  55691 #else
  55692 __ai __attribute__((target("neon"))) uint32x4_t vpmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55693   uint32x4_t __ret;
  55694   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55695   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55696   __ret = (uint32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  55697   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55698   return __ret;
  55699 }
  55700 #endif
  55701 
  55702 #ifdef __LITTLE_ENDIAN__
  55703 __ai __attribute__((target("neon"))) uint16x8_t vpmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55704   uint16x8_t __ret;
  55705   __ret = (uint16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  55706   return __ret;
  55707 }
  55708 #else
  55709 __ai __attribute__((target("neon"))) uint16x8_t vpmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55710   uint16x8_t __ret;
  55711   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55712   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  55713   __ret = (uint16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  55714   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  55715   return __ret;
  55716 }
  55717 #endif
  55718 
  55719 #ifdef __LITTLE_ENDIAN__
  55720 __ai __attribute__((target("neon"))) int8x16_t vpmaxq_s8(int8x16_t __p0, int8x16_t __p1) {
  55721   int8x16_t __ret;
  55722   __ret = (int8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  55723   return __ret;
  55724 }
  55725 #else
  55726 __ai __attribute__((target("neon"))) int8x16_t vpmaxq_s8(int8x16_t __p0, int8x16_t __p1) {
  55727   int8x16_t __ret;
  55728   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55729   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55730   __ret = (int8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  55731   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55732   return __ret;
  55733 }
  55734 #endif
  55735 
  55736 #ifdef __LITTLE_ENDIAN__
  55737 __ai __attribute__((target("neon"))) float64x2_t vpmaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  55738   float64x2_t __ret;
  55739   __ret = (float64x2_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55740   return __ret;
  55741 }
  55742 #else
  55743 __ai __attribute__((target("neon"))) float64x2_t vpmaxq_f64(float64x2_t __p0, float64x2_t __p1) {
  55744   float64x2_t __ret;
  55745   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55746   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55747   __ret = (float64x2_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  55748   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55749   return __ret;
  55750 }
  55751 #endif
  55752 
  55753 #ifdef __LITTLE_ENDIAN__
  55754 __ai __attribute__((target("neon"))) float32x4_t vpmaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  55755   float32x4_t __ret;
  55756   __ret = (float32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  55757   return __ret;
  55758 }
  55759 #else
  55760 __ai __attribute__((target("neon"))) float32x4_t vpmaxq_f32(float32x4_t __p0, float32x4_t __p1) {
  55761   float32x4_t __ret;
  55762   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55763   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55764   __ret = (float32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  55765   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55766   return __ret;
  55767 }
  55768 #endif
  55769 
  55770 #ifdef __LITTLE_ENDIAN__
  55771 __ai __attribute__((target("neon"))) int32x4_t vpmaxq_s32(int32x4_t __p0, int32x4_t __p1) {
  55772   int32x4_t __ret;
  55773   __ret = (int32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  55774   return __ret;
  55775 }
  55776 #else
  55777 __ai __attribute__((target("neon"))) int32x4_t vpmaxq_s32(int32x4_t __p0, int32x4_t __p1) {
  55778   int32x4_t __ret;
  55779   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55780   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55781   __ret = (int32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  55782   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55783   return __ret;
  55784 }
  55785 #endif
  55786 
  55787 #ifdef __LITTLE_ENDIAN__
  55788 __ai __attribute__((target("neon"))) int16x8_t vpmaxq_s16(int16x8_t __p0, int16x8_t __p1) {
  55789   int16x8_t __ret;
  55790   __ret = (int16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  55791   return __ret;
  55792 }
  55793 #else
  55794 __ai __attribute__((target("neon"))) int16x8_t vpmaxq_s16(int16x8_t __p0, int16x8_t __p1) {
  55795   int16x8_t __ret;
  55796   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55797   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  55798   __ret = (int16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  55799   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  55800   return __ret;
  55801 }
  55802 #endif
  55803 
  55804 #ifdef __LITTLE_ENDIAN__
  55805 __ai __attribute__((target("neon"))) float64_t vpmaxqd_f64(float64x2_t __p0) {
  55806   float64_t __ret;
  55807   __ret = (float64_t) __builtin_neon_vpmaxqd_f64(__p0);
  55808   return __ret;
  55809 }
  55810 #else
  55811 __ai __attribute__((target("neon"))) float64_t vpmaxqd_f64(float64x2_t __p0) {
  55812   float64_t __ret;
  55813   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55814   __ret = (float64_t) __builtin_neon_vpmaxqd_f64(__rev0);
  55815   return __ret;
  55816 }
  55817 #endif
  55818 
  55819 #ifdef __LITTLE_ENDIAN__
  55820 __ai __attribute__((target("neon"))) float32_t vpmaxs_f32(float32x2_t __p0) {
  55821   float32_t __ret;
  55822   __ret = (float32_t) __builtin_neon_vpmaxs_f32(__p0);
  55823   return __ret;
  55824 }
  55825 #else
  55826 __ai __attribute__((target("neon"))) float32_t vpmaxs_f32(float32x2_t __p0) {
  55827   float32_t __ret;
  55828   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55829   __ret = (float32_t) __builtin_neon_vpmaxs_f32(__rev0);
  55830   return __ret;
  55831 }
  55832 #endif
  55833 
  55834 #ifdef __LITTLE_ENDIAN__
  55835 __ai __attribute__((target("neon"))) float64x2_t vpmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  55836   float64x2_t __ret;
  55837   __ret = (float64x2_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55838   return __ret;
  55839 }
  55840 #else
  55841 __ai __attribute__((target("neon"))) float64x2_t vpmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  55842   float64x2_t __ret;
  55843   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55844   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55845   __ret = (float64x2_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  55846   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55847   return __ret;
  55848 }
  55849 #endif
  55850 
  55851 #ifdef __LITTLE_ENDIAN__
  55852 __ai __attribute__((target("neon"))) float32x4_t vpmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  55853   float32x4_t __ret;
  55854   __ret = (float32x4_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  55855   return __ret;
  55856 }
  55857 #else
  55858 __ai __attribute__((target("neon"))) float32x4_t vpmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  55859   float32x4_t __ret;
  55860   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55861   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55862   __ret = (float32x4_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  55863   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55864   return __ret;
  55865 }
  55866 #endif
  55867 
  55868 #ifdef __LITTLE_ENDIAN__
  55869 __ai __attribute__((target("neon"))) float32x2_t vpmaxnm_f32(float32x2_t __p0, float32x2_t __p1) {
  55870   float32x2_t __ret;
  55871   __ret = (float32x2_t) __builtin_neon_vpmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  55872   return __ret;
  55873 }
  55874 #else
  55875 __ai __attribute__((target("neon"))) float32x2_t vpmaxnm_f32(float32x2_t __p0, float32x2_t __p1) {
  55876   float32x2_t __ret;
  55877   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55878   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55879   __ret = (float32x2_t) __builtin_neon_vpmaxnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  55880   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55881   return __ret;
  55882 }
  55883 #endif
  55884 
  55885 #ifdef __LITTLE_ENDIAN__
  55886 __ai __attribute__((target("neon"))) float64_t vpmaxnmqd_f64(float64x2_t __p0) {
  55887   float64_t __ret;
  55888   __ret = (float64_t) __builtin_neon_vpmaxnmqd_f64(__p0);
  55889   return __ret;
  55890 }
  55891 #else
  55892 __ai __attribute__((target("neon"))) float64_t vpmaxnmqd_f64(float64x2_t __p0) {
  55893   float64_t __ret;
  55894   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55895   __ret = (float64_t) __builtin_neon_vpmaxnmqd_f64(__rev0);
  55896   return __ret;
  55897 }
  55898 #endif
  55899 
  55900 #ifdef __LITTLE_ENDIAN__
  55901 __ai __attribute__((target("neon"))) float32_t vpmaxnms_f32(float32x2_t __p0) {
  55902   float32_t __ret;
  55903   __ret = (float32_t) __builtin_neon_vpmaxnms_f32(__p0);
  55904   return __ret;
  55905 }
  55906 #else
  55907 __ai __attribute__((target("neon"))) float32_t vpmaxnms_f32(float32x2_t __p0) {
  55908   float32_t __ret;
  55909   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55910   __ret = (float32_t) __builtin_neon_vpmaxnms_f32(__rev0);
  55911   return __ret;
  55912 }
  55913 #endif
  55914 
  55915 #ifdef __LITTLE_ENDIAN__
  55916 __ai __attribute__((target("neon"))) uint8x16_t vpminq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55917   uint8x16_t __ret;
  55918   __ret = (uint8x16_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  55919   return __ret;
  55920 }
  55921 #else
  55922 __ai __attribute__((target("neon"))) uint8x16_t vpminq_u8(uint8x16_t __p0, uint8x16_t __p1) {
  55923   uint8x16_t __ret;
  55924   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55925   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55926   __ret = (uint8x16_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  55927   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55928   return __ret;
  55929 }
  55930 #endif
  55931 
  55932 #ifdef __LITTLE_ENDIAN__
  55933 __ai __attribute__((target("neon"))) uint32x4_t vpminq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55934   uint32x4_t __ret;
  55935   __ret = (uint32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  55936   return __ret;
  55937 }
  55938 #else
  55939 __ai __attribute__((target("neon"))) uint32x4_t vpminq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  55940   uint32x4_t __ret;
  55941   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  55942   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  55943   __ret = (uint32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  55944   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  55945   return __ret;
  55946 }
  55947 #endif
  55948 
  55949 #ifdef __LITTLE_ENDIAN__
  55950 __ai __attribute__((target("neon"))) uint16x8_t vpminq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55951   uint16x8_t __ret;
  55952   __ret = (uint16x8_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  55953   return __ret;
  55954 }
  55955 #else
  55956 __ai __attribute__((target("neon"))) uint16x8_t vpminq_u16(uint16x8_t __p0, uint16x8_t __p1) {
  55957   uint16x8_t __ret;
  55958   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  55959   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  55960   __ret = (uint16x8_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  55961   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  55962   return __ret;
  55963 }
  55964 #endif
  55965 
  55966 #ifdef __LITTLE_ENDIAN__
  55967 __ai __attribute__((target("neon"))) int8x16_t vpminq_s8(int8x16_t __p0, int8x16_t __p1) {
  55968   int8x16_t __ret;
  55969   __ret = (int8x16_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  55970   return __ret;
  55971 }
  55972 #else
  55973 __ai __attribute__((target("neon"))) int8x16_t vpminq_s8(int8x16_t __p0, int8x16_t __p1) {
  55974   int8x16_t __ret;
  55975   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55976   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55977   __ret = (int8x16_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  55978   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  55979   return __ret;
  55980 }
  55981 #endif
  55982 
  55983 #ifdef __LITTLE_ENDIAN__
  55984 __ai __attribute__((target("neon"))) float64x2_t vpminq_f64(float64x2_t __p0, float64x2_t __p1) {
  55985   float64x2_t __ret;
  55986   __ret = (float64x2_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  55987   return __ret;
  55988 }
  55989 #else
  55990 __ai __attribute__((target("neon"))) float64x2_t vpminq_f64(float64x2_t __p0, float64x2_t __p1) {
  55991   float64x2_t __ret;
  55992   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  55993   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  55994   __ret = (float64x2_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  55995   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  55996   return __ret;
  55997 }
  55998 #endif
  55999 
  56000 #ifdef __LITTLE_ENDIAN__
  56001 __ai __attribute__((target("neon"))) float32x4_t vpminq_f32(float32x4_t __p0, float32x4_t __p1) {
  56002   float32x4_t __ret;
  56003   __ret = (float32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  56004   return __ret;
  56005 }
  56006 #else
  56007 __ai __attribute__((target("neon"))) float32x4_t vpminq_f32(float32x4_t __p0, float32x4_t __p1) {
  56008   float32x4_t __ret;
  56009   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56010   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56011   __ret = (float32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  56012   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56013   return __ret;
  56014 }
  56015 #endif
  56016 
  56017 #ifdef __LITTLE_ENDIAN__
  56018 __ai __attribute__((target("neon"))) int32x4_t vpminq_s32(int32x4_t __p0, int32x4_t __p1) {
  56019   int32x4_t __ret;
  56020   __ret = (int32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  56021   return __ret;
  56022 }
  56023 #else
  56024 __ai __attribute__((target("neon"))) int32x4_t vpminq_s32(int32x4_t __p0, int32x4_t __p1) {
  56025   int32x4_t __ret;
  56026   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56027   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56028   __ret = (int32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  56029   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56030   return __ret;
  56031 }
  56032 #endif
  56033 
  56034 #ifdef __LITTLE_ENDIAN__
  56035 __ai __attribute__((target("neon"))) int16x8_t vpminq_s16(int16x8_t __p0, int16x8_t __p1) {
  56036   int16x8_t __ret;
  56037   __ret = (int16x8_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  56038   return __ret;
  56039 }
  56040 #else
  56041 __ai __attribute__((target("neon"))) int16x8_t vpminq_s16(int16x8_t __p0, int16x8_t __p1) {
  56042   int16x8_t __ret;
  56043   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  56044   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  56045   __ret = (int16x8_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  56046   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  56047   return __ret;
  56048 }
  56049 #endif
  56050 
  56051 #ifdef __LITTLE_ENDIAN__
  56052 __ai __attribute__((target("neon"))) float64_t vpminqd_f64(float64x2_t __p0) {
  56053   float64_t __ret;
  56054   __ret = (float64_t) __builtin_neon_vpminqd_f64(__p0);
  56055   return __ret;
  56056 }
  56057 #else
  56058 __ai __attribute__((target("neon"))) float64_t vpminqd_f64(float64x2_t __p0) {
  56059   float64_t __ret;
  56060   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56061   __ret = (float64_t) __builtin_neon_vpminqd_f64(__rev0);
  56062   return __ret;
  56063 }
  56064 #endif
  56065 
  56066 #ifdef __LITTLE_ENDIAN__
  56067 __ai __attribute__((target("neon"))) float32_t vpmins_f32(float32x2_t __p0) {
  56068   float32_t __ret;
  56069   __ret = (float32_t) __builtin_neon_vpmins_f32(__p0);
  56070   return __ret;
  56071 }
  56072 #else
  56073 __ai __attribute__((target("neon"))) float32_t vpmins_f32(float32x2_t __p0) {
  56074   float32_t __ret;
  56075   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56076   __ret = (float32_t) __builtin_neon_vpmins_f32(__rev0);
  56077   return __ret;
  56078 }
  56079 #endif
  56080 
  56081 #ifdef __LITTLE_ENDIAN__
  56082 __ai __attribute__((target("neon"))) float64x2_t vpminnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  56083   float64x2_t __ret;
  56084   __ret = (float64x2_t) __builtin_neon_vpminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  56085   return __ret;
  56086 }
  56087 #else
  56088 __ai __attribute__((target("neon"))) float64x2_t vpminnmq_f64(float64x2_t __p0, float64x2_t __p1) {
  56089   float64x2_t __ret;
  56090   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56091   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  56092   __ret = (float64x2_t) __builtin_neon_vpminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  56093   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56094   return __ret;
  56095 }
  56096 #endif
  56097 
  56098 #ifdef __LITTLE_ENDIAN__
  56099 __ai __attribute__((target("neon"))) float32x4_t vpminnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  56100   float32x4_t __ret;
  56101   __ret = (float32x4_t) __builtin_neon_vpminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41);
  56102   return __ret;
  56103 }
  56104 #else
  56105 __ai __attribute__((target("neon"))) float32x4_t vpminnmq_f32(float32x4_t __p0, float32x4_t __p1) {
  56106   float32x4_t __ret;
  56107   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56108   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56109   __ret = (float32x4_t) __builtin_neon_vpminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41);
  56110   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56111   return __ret;
  56112 }
  56113 #endif
  56114 
  56115 #ifdef __LITTLE_ENDIAN__
  56116 __ai __attribute__((target("neon"))) float32x2_t vpminnm_f32(float32x2_t __p0, float32x2_t __p1) {
  56117   float32x2_t __ret;
  56118   __ret = (float32x2_t) __builtin_neon_vpminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9);
  56119   return __ret;
  56120 }
  56121 #else
  56122 __ai __attribute__((target("neon"))) float32x2_t vpminnm_f32(float32x2_t __p0, float32x2_t __p1) {
  56123   float32x2_t __ret;
  56124   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56125   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  56126   __ret = (float32x2_t) __builtin_neon_vpminnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9);
  56127   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56128   return __ret;
  56129 }
  56130 #endif
  56131 
  56132 #ifdef __LITTLE_ENDIAN__
  56133 __ai __attribute__((target("neon"))) float64_t vpminnmqd_f64(float64x2_t __p0) {
  56134   float64_t __ret;
  56135   __ret = (float64_t) __builtin_neon_vpminnmqd_f64(__p0);
  56136   return __ret;
  56137 }
  56138 #else
  56139 __ai __attribute__((target("neon"))) float64_t vpminnmqd_f64(float64x2_t __p0) {
  56140   float64_t __ret;
  56141   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56142   __ret = (float64_t) __builtin_neon_vpminnmqd_f64(__rev0);
  56143   return __ret;
  56144 }
  56145 #endif
  56146 
  56147 #ifdef __LITTLE_ENDIAN__
  56148 __ai __attribute__((target("neon"))) float32_t vpminnms_f32(float32x2_t __p0) {
  56149   float32_t __ret;
  56150   __ret = (float32_t) __builtin_neon_vpminnms_f32(__p0);
  56151   return __ret;
  56152 }
  56153 #else
  56154 __ai __attribute__((target("neon"))) float32_t vpminnms_f32(float32x2_t __p0) {
  56155   float32_t __ret;
  56156   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56157   __ret = (float32_t) __builtin_neon_vpminnms_f32(__rev0);
  56158   return __ret;
  56159 }
  56160 #endif
  56161 
  56162 #ifdef __LITTLE_ENDIAN__
  56163 __ai __attribute__((target("neon"))) int64x2_t vqabsq_s64(int64x2_t __p0) {
  56164   int64x2_t __ret;
  56165   __ret = (int64x2_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 35);
  56166   return __ret;
  56167 }
  56168 #else
  56169 __ai __attribute__((target("neon"))) int64x2_t vqabsq_s64(int64x2_t __p0) {
  56170   int64x2_t __ret;
  56171   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56172   __ret = (int64x2_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 35);
  56173   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56174   return __ret;
  56175 }
  56176 #endif
  56177 
  56178 __ai __attribute__((target("neon"))) int64x1_t vqabs_s64(int64x1_t __p0) {
  56179   int64x1_t __ret;
  56180   __ret = (int64x1_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 3);
  56181   return __ret;
  56182 }
  56183 __ai __attribute__((target("neon"))) int8_t vqabsb_s8(int8_t __p0) {
  56184   int8_t __ret;
  56185   __ret = (int8_t) __builtin_neon_vqabsb_s8(__p0);
  56186   return __ret;
  56187 }
  56188 __ai __attribute__((target("neon"))) int32_t vqabss_s32(int32_t __p0) {
  56189   int32_t __ret;
  56190   __ret = (int32_t) __builtin_neon_vqabss_s32(__p0);
  56191   return __ret;
  56192 }
  56193 __ai __attribute__((target("neon"))) int64_t vqabsd_s64(int64_t __p0) {
  56194   int64_t __ret;
  56195   __ret = (int64_t) __builtin_neon_vqabsd_s64(__p0);
  56196   return __ret;
  56197 }
  56198 __ai __attribute__((target("neon"))) int16_t vqabsh_s16(int16_t __p0) {
  56199   int16_t __ret;
  56200   __ret = (int16_t) __builtin_neon_vqabsh_s16(__p0);
  56201   return __ret;
  56202 }
  56203 __ai __attribute__((target("neon"))) uint8_t vqaddb_u8(uint8_t __p0, uint8_t __p1) {
  56204   uint8_t __ret;
  56205   __ret = (uint8_t) __builtin_neon_vqaddb_u8(__p0, __p1);
  56206   return __ret;
  56207 }
  56208 __ai __attribute__((target("neon"))) uint32_t vqadds_u32(uint32_t __p0, uint32_t __p1) {
  56209   uint32_t __ret;
  56210   __ret = (uint32_t) __builtin_neon_vqadds_u32(__p0, __p1);
  56211   return __ret;
  56212 }
  56213 __ai __attribute__((target("neon"))) uint64_t vqaddd_u64(uint64_t __p0, uint64_t __p1) {
  56214   uint64_t __ret;
  56215   __ret = (uint64_t) __builtin_neon_vqaddd_u64(__p0, __p1);
  56216   return __ret;
  56217 }
  56218 __ai __attribute__((target("neon"))) uint16_t vqaddh_u16(uint16_t __p0, uint16_t __p1) {
  56219   uint16_t __ret;
  56220   __ret = (uint16_t) __builtin_neon_vqaddh_u16(__p0, __p1);
  56221   return __ret;
  56222 }
  56223 __ai __attribute__((target("neon"))) int8_t vqaddb_s8(int8_t __p0, int8_t __p1) {
  56224   int8_t __ret;
  56225   __ret = (int8_t) __builtin_neon_vqaddb_s8(__p0, __p1);
  56226   return __ret;
  56227 }
  56228 __ai __attribute__((target("neon"))) int32_t vqadds_s32(int32_t __p0, int32_t __p1) {
  56229   int32_t __ret;
  56230   __ret = (int32_t) __builtin_neon_vqadds_s32(__p0, __p1);
  56231   return __ret;
  56232 }
  56233 __ai __attribute__((target("neon"))) int64_t vqaddd_s64(int64_t __p0, int64_t __p1) {
  56234   int64_t __ret;
  56235   __ret = (int64_t) __builtin_neon_vqaddd_s64(__p0, __p1);
  56236   return __ret;
  56237 }
  56238 __ai __attribute__((target("neon"))) int16_t vqaddh_s16(int16_t __p0, int16_t __p1) {
  56239   int16_t __ret;
  56240   __ret = (int16_t) __builtin_neon_vqaddh_s16(__p0, __p1);
  56241   return __ret;
  56242 }
  56243 __ai __attribute__((target("neon"))) int64_t vqdmlals_s32(int64_t __p0, int32_t __p1, int32_t __p2) {
  56244   int64_t __ret;
  56245   __ret = (int64_t) __builtin_neon_vqdmlals_s32(__p0, __p1, __p2);
  56246   return __ret;
  56247 }
  56248 __ai __attribute__((target("neon"))) int32_t vqdmlalh_s16(int32_t __p0, int16_t __p1, int16_t __p2) {
  56249   int32_t __ret;
  56250   __ret = (int32_t) __builtin_neon_vqdmlalh_s16(__p0, __p1, __p2);
  56251   return __ret;
  56252 }
  56253 #ifdef __LITTLE_ENDIAN__
  56254 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  56255   int64x2_t __ret;
  56256   __ret = vqdmlal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2));
  56257   return __ret;
  56258 }
  56259 #else
  56260 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  56261   int64x2_t __ret;
  56262   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56263   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56264   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  56265   __ret = __noswap_vqdmlal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2));
  56266   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56267   return __ret;
  56268 }
  56269 #endif
  56270 
  56271 #ifdef __LITTLE_ENDIAN__
  56272 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  56273   int32x4_t __ret;
  56274   __ret = vqdmlal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2));
  56275   return __ret;
  56276 }
  56277 #else
  56278 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  56279   int32x4_t __ret;
  56280   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56281   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  56282   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  56283   __ret = __noswap_vqdmlal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2));
  56284   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56285   return __ret;
  56286 }
  56287 #endif
  56288 
  56289 #ifdef __LITTLE_ENDIAN__
  56290 #define vqdmlal_high_lane_s32(__p0_628, __p1_628, __p2_628, __p3_628) __extension__ ({ \
  56291   int64x2_t __ret_628; \
  56292   int64x2_t __s0_628 = __p0_628; \
  56293   int32x4_t __s1_628 = __p1_628; \
  56294   int32x2_t __s2_628 = __p2_628; \
  56295   __ret_628 = vqdmlal_s32(__s0_628, vget_high_s32(__s1_628), splat_lane_s32(__s2_628, __p3_628)); \
  56296   __ret_628; \
  56297 })
  56298 #else
  56299 #define vqdmlal_high_lane_s32(__p0_629, __p1_629, __p2_629, __p3_629) __extension__ ({ \
  56300   int64x2_t __ret_629; \
  56301   int64x2_t __s0_629 = __p0_629; \
  56302   int32x4_t __s1_629 = __p1_629; \
  56303   int32x2_t __s2_629 = __p2_629; \
  56304   int64x2_t __rev0_629;  __rev0_629 = __builtin_shufflevector(__s0_629, __s0_629, 1, 0); \
  56305   int32x4_t __rev1_629;  __rev1_629 = __builtin_shufflevector(__s1_629, __s1_629, 3, 2, 1, 0); \
  56306   int32x2_t __rev2_629;  __rev2_629 = __builtin_shufflevector(__s2_629, __s2_629, 1, 0); \
  56307   __ret_629 = __noswap_vqdmlal_s32(__rev0_629, __noswap_vget_high_s32(__rev1_629), __noswap_splat_lane_s32(__rev2_629, __p3_629)); \
  56308   __ret_629 = __builtin_shufflevector(__ret_629, __ret_629, 1, 0); \
  56309   __ret_629; \
  56310 })
  56311 #endif
  56312 
  56313 #ifdef __LITTLE_ENDIAN__
  56314 #define vqdmlal_high_lane_s16(__p0_630, __p1_630, __p2_630, __p3_630) __extension__ ({ \
  56315   int32x4_t __ret_630; \
  56316   int32x4_t __s0_630 = __p0_630; \
  56317   int16x8_t __s1_630 = __p1_630; \
  56318   int16x4_t __s2_630 = __p2_630; \
  56319   __ret_630 = vqdmlal_s16(__s0_630, vget_high_s16(__s1_630), splat_lane_s16(__s2_630, __p3_630)); \
  56320   __ret_630; \
  56321 })
  56322 #else
  56323 #define vqdmlal_high_lane_s16(__p0_631, __p1_631, __p2_631, __p3_631) __extension__ ({ \
  56324   int32x4_t __ret_631; \
  56325   int32x4_t __s0_631 = __p0_631; \
  56326   int16x8_t __s1_631 = __p1_631; \
  56327   int16x4_t __s2_631 = __p2_631; \
  56328   int32x4_t __rev0_631;  __rev0_631 = __builtin_shufflevector(__s0_631, __s0_631, 3, 2, 1, 0); \
  56329   int16x8_t __rev1_631;  __rev1_631 = __builtin_shufflevector(__s1_631, __s1_631, 7, 6, 5, 4, 3, 2, 1, 0); \
  56330   int16x4_t __rev2_631;  __rev2_631 = __builtin_shufflevector(__s2_631, __s2_631, 3, 2, 1, 0); \
  56331   __ret_631 = __noswap_vqdmlal_s16(__rev0_631, __noswap_vget_high_s16(__rev1_631), __noswap_splat_lane_s16(__rev2_631, __p3_631)); \
  56332   __ret_631 = __builtin_shufflevector(__ret_631, __ret_631, 3, 2, 1, 0); \
  56333   __ret_631; \
  56334 })
  56335 #endif
  56336 
  56337 #ifdef __LITTLE_ENDIAN__
  56338 #define vqdmlal_high_laneq_s32(__p0_632, __p1_632, __p2_632, __p3_632) __extension__ ({ \
  56339   int64x2_t __ret_632; \
  56340   int64x2_t __s0_632 = __p0_632; \
  56341   int32x4_t __s1_632 = __p1_632; \
  56342   int32x4_t __s2_632 = __p2_632; \
  56343   __ret_632 = vqdmlal_s32(__s0_632, vget_high_s32(__s1_632), splat_laneq_s32(__s2_632, __p3_632)); \
  56344   __ret_632; \
  56345 })
  56346 #else
  56347 #define vqdmlal_high_laneq_s32(__p0_633, __p1_633, __p2_633, __p3_633) __extension__ ({ \
  56348   int64x2_t __ret_633; \
  56349   int64x2_t __s0_633 = __p0_633; \
  56350   int32x4_t __s1_633 = __p1_633; \
  56351   int32x4_t __s2_633 = __p2_633; \
  56352   int64x2_t __rev0_633;  __rev0_633 = __builtin_shufflevector(__s0_633, __s0_633, 1, 0); \
  56353   int32x4_t __rev1_633;  __rev1_633 = __builtin_shufflevector(__s1_633, __s1_633, 3, 2, 1, 0); \
  56354   int32x4_t __rev2_633;  __rev2_633 = __builtin_shufflevector(__s2_633, __s2_633, 3, 2, 1, 0); \
  56355   __ret_633 = __noswap_vqdmlal_s32(__rev0_633, __noswap_vget_high_s32(__rev1_633), __noswap_splat_laneq_s32(__rev2_633, __p3_633)); \
  56356   __ret_633 = __builtin_shufflevector(__ret_633, __ret_633, 1, 0); \
  56357   __ret_633; \
  56358 })
  56359 #endif
  56360 
  56361 #ifdef __LITTLE_ENDIAN__
  56362 #define vqdmlal_high_laneq_s16(__p0_634, __p1_634, __p2_634, __p3_634) __extension__ ({ \
  56363   int32x4_t __ret_634; \
  56364   int32x4_t __s0_634 = __p0_634; \
  56365   int16x8_t __s1_634 = __p1_634; \
  56366   int16x8_t __s2_634 = __p2_634; \
  56367   __ret_634 = vqdmlal_s16(__s0_634, vget_high_s16(__s1_634), splat_laneq_s16(__s2_634, __p3_634)); \
  56368   __ret_634; \
  56369 })
  56370 #else
  56371 #define vqdmlal_high_laneq_s16(__p0_635, __p1_635, __p2_635, __p3_635) __extension__ ({ \
  56372   int32x4_t __ret_635; \
  56373   int32x4_t __s0_635 = __p0_635; \
  56374   int16x8_t __s1_635 = __p1_635; \
  56375   int16x8_t __s2_635 = __p2_635; \
  56376   int32x4_t __rev0_635;  __rev0_635 = __builtin_shufflevector(__s0_635, __s0_635, 3, 2, 1, 0); \
  56377   int16x8_t __rev1_635;  __rev1_635 = __builtin_shufflevector(__s1_635, __s1_635, 7, 6, 5, 4, 3, 2, 1, 0); \
  56378   int16x8_t __rev2_635;  __rev2_635 = __builtin_shufflevector(__s2_635, __s2_635, 7, 6, 5, 4, 3, 2, 1, 0); \
  56379   __ret_635 = __noswap_vqdmlal_s16(__rev0_635, __noswap_vget_high_s16(__rev1_635), __noswap_splat_laneq_s16(__rev2_635, __p3_635)); \
  56380   __ret_635 = __builtin_shufflevector(__ret_635, __ret_635, 3, 2, 1, 0); \
  56381   __ret_635; \
  56382 })
  56383 #endif
  56384 
  56385 #ifdef __LITTLE_ENDIAN__
  56386 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  56387   int64x2_t __ret;
  56388   __ret = vqdmlal_n_s32(__p0, vget_high_s32(__p1), __p2);
  56389   return __ret;
  56390 }
  56391 #else
  56392 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  56393   int64x2_t __ret;
  56394   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56395   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56396   __ret = __noswap_vqdmlal_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2);
  56397   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56398   return __ret;
  56399 }
  56400 #endif
  56401 
  56402 #ifdef __LITTLE_ENDIAN__
  56403 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  56404   int32x4_t __ret;
  56405   __ret = vqdmlal_n_s16(__p0, vget_high_s16(__p1), __p2);
  56406   return __ret;
  56407 }
  56408 #else
  56409 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  56410   int32x4_t __ret;
  56411   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56412   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  56413   __ret = __noswap_vqdmlal_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2);
  56414   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56415   return __ret;
  56416 }
  56417 #endif
  56418 
  56419 #ifdef __LITTLE_ENDIAN__
  56420 #define vqdmlals_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
  56421   int64_t __ret; \
  56422   int64_t __s0 = __p0; \
  56423   int32_t __s1 = __p1; \
  56424   int32x2_t __s2 = __p2; \
  56425   __ret = (int64_t) __builtin_neon_vqdmlals_lane_s32(__s0, __s1, __s2, __p3); \
  56426   __ret; \
  56427 })
  56428 #else
  56429 #define vqdmlals_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
  56430   int64_t __ret; \
  56431   int64_t __s0 = __p0; \
  56432   int32_t __s1 = __p1; \
  56433   int32x2_t __s2 = __p2; \
  56434   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \
  56435   __ret = (int64_t) __builtin_neon_vqdmlals_lane_s32(__s0, __s1, __rev2, __p3); \
  56436   __ret; \
  56437 })
  56438 #endif
  56439 
  56440 #ifdef __LITTLE_ENDIAN__
  56441 #define vqdmlalh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
  56442   int32_t __ret; \
  56443   int32_t __s0 = __p0; \
  56444   int16_t __s1 = __p1; \
  56445   int16x4_t __s2 = __p2; \
  56446   __ret = (int32_t) __builtin_neon_vqdmlalh_lane_s16(__s0, __s1, __s2, __p3); \
  56447   __ret; \
  56448 })
  56449 #else
  56450 #define vqdmlalh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
  56451   int32_t __ret; \
  56452   int32_t __s0 = __p0; \
  56453   int16_t __s1 = __p1; \
  56454   int16x4_t __s2 = __p2; \
  56455   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  56456   __ret = (int32_t) __builtin_neon_vqdmlalh_lane_s16(__s0, __s1, __rev2, __p3); \
  56457   __ret; \
  56458 })
  56459 #endif
  56460 
  56461 #ifdef __LITTLE_ENDIAN__
  56462 #define vqdmlals_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
  56463   int64_t __ret; \
  56464   int64_t __s0 = __p0; \
  56465   int32_t __s1 = __p1; \
  56466   int32x4_t __s2 = __p2; \
  56467   __ret = (int64_t) __builtin_neon_vqdmlals_laneq_s32(__s0, __s1, __s2, __p3); \
  56468   __ret; \
  56469 })
  56470 #else
  56471 #define vqdmlals_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
  56472   int64_t __ret; \
  56473   int64_t __s0 = __p0; \
  56474   int32_t __s1 = __p1; \
  56475   int32x4_t __s2 = __p2; \
  56476   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  56477   __ret = (int64_t) __builtin_neon_vqdmlals_laneq_s32(__s0, __s1, __rev2, __p3); \
  56478   __ret; \
  56479 })
  56480 #endif
  56481 
  56482 #ifdef __LITTLE_ENDIAN__
  56483 #define vqdmlalh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
  56484   int32_t __ret; \
  56485   int32_t __s0 = __p0; \
  56486   int16_t __s1 = __p1; \
  56487   int16x8_t __s2 = __p2; \
  56488   __ret = (int32_t) __builtin_neon_vqdmlalh_laneq_s16(__s0, __s1, __s2, __p3); \
  56489   __ret; \
  56490 })
  56491 #else
  56492 #define vqdmlalh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
  56493   int32_t __ret; \
  56494   int32_t __s0 = __p0; \
  56495   int16_t __s1 = __p1; \
  56496   int16x8_t __s2 = __p2; \
  56497   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
  56498   __ret = (int32_t) __builtin_neon_vqdmlalh_laneq_s16(__s0, __s1, __rev2, __p3); \
  56499   __ret; \
  56500 })
  56501 #endif
  56502 
  56503 #ifdef __LITTLE_ENDIAN__
  56504 #define vqdmlal_laneq_s32(__p0_636, __p1_636, __p2_636, __p3_636) __extension__ ({ \
  56505   int64x2_t __ret_636; \
  56506   int64x2_t __s0_636 = __p0_636; \
  56507   int32x2_t __s1_636 = __p1_636; \
  56508   int32x4_t __s2_636 = __p2_636; \
  56509   __ret_636 = vqdmlal_s32(__s0_636, __s1_636, splat_laneq_s32(__s2_636, __p3_636)); \
  56510   __ret_636; \
  56511 })
  56512 #else
  56513 #define vqdmlal_laneq_s32(__p0_637, __p1_637, __p2_637, __p3_637) __extension__ ({ \
  56514   int64x2_t __ret_637; \
  56515   int64x2_t __s0_637 = __p0_637; \
  56516   int32x2_t __s1_637 = __p1_637; \
  56517   int32x4_t __s2_637 = __p2_637; \
  56518   int64x2_t __rev0_637;  __rev0_637 = __builtin_shufflevector(__s0_637, __s0_637, 1, 0); \
  56519   int32x2_t __rev1_637;  __rev1_637 = __builtin_shufflevector(__s1_637, __s1_637, 1, 0); \
  56520   int32x4_t __rev2_637;  __rev2_637 = __builtin_shufflevector(__s2_637, __s2_637, 3, 2, 1, 0); \
  56521   __ret_637 = __noswap_vqdmlal_s32(__rev0_637, __rev1_637, __noswap_splat_laneq_s32(__rev2_637, __p3_637)); \
  56522   __ret_637 = __builtin_shufflevector(__ret_637, __ret_637, 1, 0); \
  56523   __ret_637; \
  56524 })
  56525 #endif
  56526 
  56527 #ifdef __LITTLE_ENDIAN__
  56528 #define vqdmlal_laneq_s16(__p0_638, __p1_638, __p2_638, __p3_638) __extension__ ({ \
  56529   int32x4_t __ret_638; \
  56530   int32x4_t __s0_638 = __p0_638; \
  56531   int16x4_t __s1_638 = __p1_638; \
  56532   int16x8_t __s2_638 = __p2_638; \
  56533   __ret_638 = vqdmlal_s16(__s0_638, __s1_638, splat_laneq_s16(__s2_638, __p3_638)); \
  56534   __ret_638; \
  56535 })
  56536 #else
  56537 #define vqdmlal_laneq_s16(__p0_639, __p1_639, __p2_639, __p3_639) __extension__ ({ \
  56538   int32x4_t __ret_639; \
  56539   int32x4_t __s0_639 = __p0_639; \
  56540   int16x4_t __s1_639 = __p1_639; \
  56541   int16x8_t __s2_639 = __p2_639; \
  56542   int32x4_t __rev0_639;  __rev0_639 = __builtin_shufflevector(__s0_639, __s0_639, 3, 2, 1, 0); \
  56543   int16x4_t __rev1_639;  __rev1_639 = __builtin_shufflevector(__s1_639, __s1_639, 3, 2, 1, 0); \
  56544   int16x8_t __rev2_639;  __rev2_639 = __builtin_shufflevector(__s2_639, __s2_639, 7, 6, 5, 4, 3, 2, 1, 0); \
  56545   __ret_639 = __noswap_vqdmlal_s16(__rev0_639, __rev1_639, __noswap_splat_laneq_s16(__rev2_639, __p3_639)); \
  56546   __ret_639 = __builtin_shufflevector(__ret_639, __ret_639, 3, 2, 1, 0); \
  56547   __ret_639; \
  56548 })
  56549 #endif
  56550 
  56551 __ai __attribute__((target("neon"))) int64_t vqdmlsls_s32(int64_t __p0, int32_t __p1, int32_t __p2) {
  56552   int64_t __ret;
  56553   __ret = (int64_t) __builtin_neon_vqdmlsls_s32(__p0, __p1, __p2);
  56554   return __ret;
  56555 }
  56556 __ai __attribute__((target("neon"))) int32_t vqdmlslh_s16(int32_t __p0, int16_t __p1, int16_t __p2) {
  56557   int32_t __ret;
  56558   __ret = (int32_t) __builtin_neon_vqdmlslh_s16(__p0, __p1, __p2);
  56559   return __ret;
  56560 }
  56561 #ifdef __LITTLE_ENDIAN__
  56562 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  56563   int64x2_t __ret;
  56564   __ret = vqdmlsl_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2));
  56565   return __ret;
  56566 }
  56567 #else
  56568 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  56569   int64x2_t __ret;
  56570   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56571   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56572   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  56573   __ret = __noswap_vqdmlsl_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2));
  56574   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56575   return __ret;
  56576 }
  56577 #endif
  56578 
  56579 #ifdef __LITTLE_ENDIAN__
  56580 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  56581   int32x4_t __ret;
  56582   __ret = vqdmlsl_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2));
  56583   return __ret;
  56584 }
  56585 #else
  56586 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  56587   int32x4_t __ret;
  56588   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56589   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  56590   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  56591   __ret = __noswap_vqdmlsl_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2));
  56592   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56593   return __ret;
  56594 }
  56595 #endif
  56596 
  56597 #ifdef __LITTLE_ENDIAN__
  56598 #define vqdmlsl_high_lane_s32(__p0_640, __p1_640, __p2_640, __p3_640) __extension__ ({ \
  56599   int64x2_t __ret_640; \
  56600   int64x2_t __s0_640 = __p0_640; \
  56601   int32x4_t __s1_640 = __p1_640; \
  56602   int32x2_t __s2_640 = __p2_640; \
  56603   __ret_640 = vqdmlsl_s32(__s0_640, vget_high_s32(__s1_640), splat_lane_s32(__s2_640, __p3_640)); \
  56604   __ret_640; \
  56605 })
  56606 #else
  56607 #define vqdmlsl_high_lane_s32(__p0_641, __p1_641, __p2_641, __p3_641) __extension__ ({ \
  56608   int64x2_t __ret_641; \
  56609   int64x2_t __s0_641 = __p0_641; \
  56610   int32x4_t __s1_641 = __p1_641; \
  56611   int32x2_t __s2_641 = __p2_641; \
  56612   int64x2_t __rev0_641;  __rev0_641 = __builtin_shufflevector(__s0_641, __s0_641, 1, 0); \
  56613   int32x4_t __rev1_641;  __rev1_641 = __builtin_shufflevector(__s1_641, __s1_641, 3, 2, 1, 0); \
  56614   int32x2_t __rev2_641;  __rev2_641 = __builtin_shufflevector(__s2_641, __s2_641, 1, 0); \
  56615   __ret_641 = __noswap_vqdmlsl_s32(__rev0_641, __noswap_vget_high_s32(__rev1_641), __noswap_splat_lane_s32(__rev2_641, __p3_641)); \
  56616   __ret_641 = __builtin_shufflevector(__ret_641, __ret_641, 1, 0); \
  56617   __ret_641; \
  56618 })
  56619 #endif
  56620 
  56621 #ifdef __LITTLE_ENDIAN__
  56622 #define vqdmlsl_high_lane_s16(__p0_642, __p1_642, __p2_642, __p3_642) __extension__ ({ \
  56623   int32x4_t __ret_642; \
  56624   int32x4_t __s0_642 = __p0_642; \
  56625   int16x8_t __s1_642 = __p1_642; \
  56626   int16x4_t __s2_642 = __p2_642; \
  56627   __ret_642 = vqdmlsl_s16(__s0_642, vget_high_s16(__s1_642), splat_lane_s16(__s2_642, __p3_642)); \
  56628   __ret_642; \
  56629 })
  56630 #else
  56631 #define vqdmlsl_high_lane_s16(__p0_643, __p1_643, __p2_643, __p3_643) __extension__ ({ \
  56632   int32x4_t __ret_643; \
  56633   int32x4_t __s0_643 = __p0_643; \
  56634   int16x8_t __s1_643 = __p1_643; \
  56635   int16x4_t __s2_643 = __p2_643; \
  56636   int32x4_t __rev0_643;  __rev0_643 = __builtin_shufflevector(__s0_643, __s0_643, 3, 2, 1, 0); \
  56637   int16x8_t __rev1_643;  __rev1_643 = __builtin_shufflevector(__s1_643, __s1_643, 7, 6, 5, 4, 3, 2, 1, 0); \
  56638   int16x4_t __rev2_643;  __rev2_643 = __builtin_shufflevector(__s2_643, __s2_643, 3, 2, 1, 0); \
  56639   __ret_643 = __noswap_vqdmlsl_s16(__rev0_643, __noswap_vget_high_s16(__rev1_643), __noswap_splat_lane_s16(__rev2_643, __p3_643)); \
  56640   __ret_643 = __builtin_shufflevector(__ret_643, __ret_643, 3, 2, 1, 0); \
  56641   __ret_643; \
  56642 })
  56643 #endif
  56644 
  56645 #ifdef __LITTLE_ENDIAN__
  56646 #define vqdmlsl_high_laneq_s32(__p0_644, __p1_644, __p2_644, __p3_644) __extension__ ({ \
  56647   int64x2_t __ret_644; \
  56648   int64x2_t __s0_644 = __p0_644; \
  56649   int32x4_t __s1_644 = __p1_644; \
  56650   int32x4_t __s2_644 = __p2_644; \
  56651   __ret_644 = vqdmlsl_s32(__s0_644, vget_high_s32(__s1_644), splat_laneq_s32(__s2_644, __p3_644)); \
  56652   __ret_644; \
  56653 })
  56654 #else
  56655 #define vqdmlsl_high_laneq_s32(__p0_645, __p1_645, __p2_645, __p3_645) __extension__ ({ \
  56656   int64x2_t __ret_645; \
  56657   int64x2_t __s0_645 = __p0_645; \
  56658   int32x4_t __s1_645 = __p1_645; \
  56659   int32x4_t __s2_645 = __p2_645; \
  56660   int64x2_t __rev0_645;  __rev0_645 = __builtin_shufflevector(__s0_645, __s0_645, 1, 0); \
  56661   int32x4_t __rev1_645;  __rev1_645 = __builtin_shufflevector(__s1_645, __s1_645, 3, 2, 1, 0); \
  56662   int32x4_t __rev2_645;  __rev2_645 = __builtin_shufflevector(__s2_645, __s2_645, 3, 2, 1, 0); \
  56663   __ret_645 = __noswap_vqdmlsl_s32(__rev0_645, __noswap_vget_high_s32(__rev1_645), __noswap_splat_laneq_s32(__rev2_645, __p3_645)); \
  56664   __ret_645 = __builtin_shufflevector(__ret_645, __ret_645, 1, 0); \
  56665   __ret_645; \
  56666 })
  56667 #endif
  56668 
  56669 #ifdef __LITTLE_ENDIAN__
  56670 #define vqdmlsl_high_laneq_s16(__p0_646, __p1_646, __p2_646, __p3_646) __extension__ ({ \
  56671   int32x4_t __ret_646; \
  56672   int32x4_t __s0_646 = __p0_646; \
  56673   int16x8_t __s1_646 = __p1_646; \
  56674   int16x8_t __s2_646 = __p2_646; \
  56675   __ret_646 = vqdmlsl_s16(__s0_646, vget_high_s16(__s1_646), splat_laneq_s16(__s2_646, __p3_646)); \
  56676   __ret_646; \
  56677 })
  56678 #else
  56679 #define vqdmlsl_high_laneq_s16(__p0_647, __p1_647, __p2_647, __p3_647) __extension__ ({ \
  56680   int32x4_t __ret_647; \
  56681   int32x4_t __s0_647 = __p0_647; \
  56682   int16x8_t __s1_647 = __p1_647; \
  56683   int16x8_t __s2_647 = __p2_647; \
  56684   int32x4_t __rev0_647;  __rev0_647 = __builtin_shufflevector(__s0_647, __s0_647, 3, 2, 1, 0); \
  56685   int16x8_t __rev1_647;  __rev1_647 = __builtin_shufflevector(__s1_647, __s1_647, 7, 6, 5, 4, 3, 2, 1, 0); \
  56686   int16x8_t __rev2_647;  __rev2_647 = __builtin_shufflevector(__s2_647, __s2_647, 7, 6, 5, 4, 3, 2, 1, 0); \
  56687   __ret_647 = __noswap_vqdmlsl_s16(__rev0_647, __noswap_vget_high_s16(__rev1_647), __noswap_splat_laneq_s16(__rev2_647, __p3_647)); \
  56688   __ret_647 = __builtin_shufflevector(__ret_647, __ret_647, 3, 2, 1, 0); \
  56689   __ret_647; \
  56690 })
  56691 #endif
  56692 
  56693 #ifdef __LITTLE_ENDIAN__
  56694 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  56695   int64x2_t __ret;
  56696   __ret = vqdmlsl_n_s32(__p0, vget_high_s32(__p1), __p2);
  56697   return __ret;
  56698 }
  56699 #else
  56700 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  56701   int64x2_t __ret;
  56702   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  56703   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  56704   __ret = __noswap_vqdmlsl_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2);
  56705   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  56706   return __ret;
  56707 }
  56708 #endif
  56709 
  56710 #ifdef __LITTLE_ENDIAN__
  56711 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  56712   int32x4_t __ret;
  56713   __ret = vqdmlsl_n_s16(__p0, vget_high_s16(__p1), __p2);
  56714   return __ret;
  56715 }
  56716 #else
  56717 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  56718   int32x4_t __ret;
  56719   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  56720   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  56721   __ret = __noswap_vqdmlsl_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2);
  56722   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  56723   return __ret;
  56724 }
  56725 #endif
  56726 
  /* vqdmlsls_lane_s32(__p0, __p1, __p2, __p3): evaluates to the int64_t result
   * of __builtin_neon_vqdmlsls_lane_s32 on the scalars __p0 and __p1, the
   * int32x2_t vector __p2 and the lane index __p3.
   * The result is a scalar, so the big-endian variant only reverses the lanes
   * of the vector operand before the builtin call. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlsls_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
    int64_t __s0 = __p0; \
    int32_t __s1 = __p1; \
    int32x2_t __s2 = __p2; \
    (int64_t) __builtin_neon_vqdmlsls_lane_s32(__s0, __s1, __s2, __p3); \
  })
  #else
  #define vqdmlsls_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
    int64_t __s0 = __p0; \
    int32_t __s1 = __p1; \
    int32x2_t __s2 = __p2; \
    int32x2_t __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \
    (int64_t) __builtin_neon_vqdmlsls_lane_s32(__s0, __s1, __rev2, __p3); \
  })
  #endif
  56747 
  /* vqdmlslh_lane_s16(__p0, __p1, __p2, __p3): evaluates to the int32_t result
   * of __builtin_neon_vqdmlslh_lane_s16 on the scalars __p0 and __p1, the
   * int16x4_t vector __p2 and the lane index __p3.
   * The result is a scalar, so the big-endian variant only reverses the lanes
   * of the vector operand before the builtin call. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlslh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
    int32_t __s0 = __p0; \
    int16_t __s1 = __p1; \
    int16x4_t __s2 = __p2; \
    (int32_t) __builtin_neon_vqdmlslh_lane_s16(__s0, __s1, __s2, __p3); \
  })
  #else
  #define vqdmlslh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
    int32_t __s0 = __p0; \
    int16_t __s1 = __p1; \
    int16x4_t __s2 = __p2; \
    int16x4_t __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
    (int32_t) __builtin_neon_vqdmlslh_lane_s16(__s0, __s1, __rev2, __p3); \
  })
  #endif
  56768 
  /* vqdmlsls_laneq_s32(__p0, __p1, __p2, __p3): evaluates to the int64_t
   * result of __builtin_neon_vqdmlsls_laneq_s32 on the scalars __p0 and __p1,
   * the int32x4_t vector __p2 and the lane index __p3.
   * The result is a scalar, so the big-endian variant only reverses the lanes
   * of the vector operand before the builtin call. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlsls_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
    int64_t __s0 = __p0; \
    int32_t __s1 = __p1; \
    int32x4_t __s2 = __p2; \
    (int64_t) __builtin_neon_vqdmlsls_laneq_s32(__s0, __s1, __s2, __p3); \
  })
  #else
  #define vqdmlsls_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \
    int64_t __s0 = __p0; \
    int32_t __s1 = __p1; \
    int32x4_t __s2 = __p2; \
    int32x4_t __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
    (int64_t) __builtin_neon_vqdmlsls_laneq_s32(__s0, __s1, __rev2, __p3); \
  })
  #endif
  56789 
  /* vqdmlslh_laneq_s16(__p0, __p1, __p2, __p3): evaluates to the int32_t
   * result of __builtin_neon_vqdmlslh_laneq_s16 on the scalars __p0 and __p1,
   * the int16x8_t vector __p2 and the lane index __p3.
   * The result is a scalar, so the big-endian variant only reverses the lanes
   * of the vector operand before the builtin call. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlslh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
    int32_t __s0 = __p0; \
    int16_t __s1 = __p1; \
    int16x8_t __s2 = __p2; \
    (int32_t) __builtin_neon_vqdmlslh_laneq_s16(__s0, __s1, __s2, __p3); \
  })
  #else
  #define vqdmlslh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \
    int32_t __s0 = __p0; \
    int16_t __s1 = __p1; \
    int16x8_t __s2 = __p2; \
    int16x8_t __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \
    (int32_t) __builtin_neon_vqdmlslh_laneq_s16(__s0, __s1, __rev2, __p3); \
  })
  #endif
  56810 
  /* vqdmlsl_laneq_s32(__p0, __p1, __p2, __p3): forwards to vqdmlsl_s32 with
   * __p0, __p1 and lane __p3 of __p2 broadcast through splat_laneq_s32.
   * The big-endian variant reverses the lanes of all three vector operands,
   * calls the __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlsl_laneq_s32(__p0_648, __p1_648, __p2_648, __p3_648) __extension__ ({ \
    int64x2_t __s0_648 = __p0_648; \
    int32x2_t __s1_648 = __p1_648; \
    int32x4_t __s2_648 = __p2_648; \
    vqdmlsl_s32(__s0_648, __s1_648, splat_laneq_s32(__s2_648, __p3_648)); \
  })
  #else
  #define vqdmlsl_laneq_s32(__p0_649, __p1_649, __p2_649, __p3_649) __extension__ ({ \
    int64x2_t __s0_649 = __p0_649; \
    int32x2_t __s1_649 = __p1_649; \
    int32x4_t __s2_649 = __p2_649; \
    int64x2_t __rev0_649 = __builtin_shufflevector(__s0_649, __s0_649, 1, 0); \
    int32x2_t __rev1_649 = __builtin_shufflevector(__s1_649, __s1_649, 1, 0); \
    int32x4_t __rev2_649 = __builtin_shufflevector(__s2_649, __s2_649, 3, 2, 1, 0); \
    int64x2_t __ret_649 = __noswap_vqdmlsl_s32(__rev0_649, __rev1_649, __noswap_splat_laneq_s32(__rev2_649, __p3_649)); \
    __ret_649 = __builtin_shufflevector(__ret_649, __ret_649, 1, 0); \
    __ret_649; \
  })
  #endif
  56834 
  /* vqdmlsl_laneq_s16(__p0, __p1, __p2, __p3): forwards to vqdmlsl_s16 with
   * __p0, __p1 and lane __p3 of __p2 broadcast through splat_laneq_s16.
   * The big-endian variant reverses the lanes of all three vector operands,
   * calls the __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmlsl_laneq_s16(__p0_650, __p1_650, __p2_650, __p3_650) __extension__ ({ \
    int32x4_t __s0_650 = __p0_650; \
    int16x4_t __s1_650 = __p1_650; \
    int16x8_t __s2_650 = __p2_650; \
    vqdmlsl_s16(__s0_650, __s1_650, splat_laneq_s16(__s2_650, __p3_650)); \
  })
  #else
  #define vqdmlsl_laneq_s16(__p0_651, __p1_651, __p2_651, __p3_651) __extension__ ({ \
    int32x4_t __s0_651 = __p0_651; \
    int16x4_t __s1_651 = __p1_651; \
    int16x8_t __s2_651 = __p2_651; \
    int32x4_t __rev0_651 = __builtin_shufflevector(__s0_651, __s0_651, 3, 2, 1, 0); \
    int16x4_t __rev1_651 = __builtin_shufflevector(__s1_651, __s1_651, 3, 2, 1, 0); \
    int16x8_t __rev2_651 = __builtin_shufflevector(__s2_651, __s2_651, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x4_t __ret_651 = __noswap_vqdmlsl_s16(__rev0_651, __rev1_651, __noswap_splat_laneq_s16(__rev2_651, __p3_651)); \
    __ret_651 = __builtin_shufflevector(__ret_651, __ret_651, 3, 2, 1, 0); \
    __ret_651; \
  })
  #endif
  56858 
  56859 __ai __attribute__((target("neon"))) int32_t vqdmulhs_s32(int32_t __p0, int32_t __p1) {
  56860   int32_t __ret;
  56861   __ret = (int32_t) __builtin_neon_vqdmulhs_s32(__p0, __p1);
  56862   return __ret;
  56863 }
  56864 __ai __attribute__((target("neon"))) int16_t vqdmulhh_s16(int16_t __p0, int16_t __p1) {
  56865   int16_t __ret;
  56866   __ret = (int16_t) __builtin_neon_vqdmulhh_s16(__p0, __p1);
  56867   return __ret;
  56868 }
  /* vqdmulhq_lane_s32(__p0, __p1, __p2): evaluates to the int32x4_t result of
   * __builtin_neon_vqdmulhq_lane_v on __p0 (int32x4_t), __p1 (int32x2_t) and
   * lane index __p2; the operands are passed as byte vectors together with
   * the type code 2.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __s0 = __p0; \
    int32x2_t __s1 = __p1; \
    (int32x4_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 2); \
  })
  #else
  #define vqdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __s0 = __p0; \
    int32x2_t __s1 = __p1; \
    int32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    int32x2_t __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
    int32x4_t __ret = (int32x4_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
    __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  56889 
  /* vqdmulhq_lane_s16(__p0, __p1, __p2): evaluates to the int16x8_t result of
   * __builtin_neon_vqdmulhq_lane_v on __p0 (int16x8_t), __p1 (int16x4_t) and
   * lane index __p2; the operands are passed as byte vectors together with
   * the type code 1.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __s0 = __p0; \
    int16x4_t __s1 = __p1; \
    (int16x8_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 1); \
  })
  #else
  #define vqdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __s0 = __p0; \
    int16x4_t __s1 = __p1; \
    int16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    int16x8_t __ret = (int16x8_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
    __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  56910 
  /* vqdmulh_lane_s32(__p0, __p1, __p2): evaluates to the int32x2_t result of
   * __builtin_neon_vqdmulh_lane_v on __p0 and __p1 (both int32x2_t) and lane
   * index __p2; the operands are passed as byte vectors together with the
   * type code 2.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __s0 = __p0; \
    int32x2_t __s1 = __p1; \
    (int32x2_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  })
  #else
  #define vqdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __s0 = __p0; \
    int32x2_t __s1 = __p1; \
    int32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
    int32x2_t __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
    int32x2_t __ret = (int32x2_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
    __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
    __ret; \
  })
  #endif
  56931 
  /* vqdmulh_lane_s16(__p0, __p1, __p2): evaluates to the int16x4_t result of
   * __builtin_neon_vqdmulh_lane_v on __p0 and __p1 (both int16x4_t) and lane
   * index __p2; the operands are passed as byte vectors together with the
   * type code 1.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s0 = __p0; \
    int16x4_t __s1 = __p1; \
    (int16x4_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  })
  #else
  #define vqdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s0 = __p0; \
    int16x4_t __s1 = __p1; \
    int16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    int16x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    int16x4_t __ret = (int16x4_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
    __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  56952 
  /* vqdmulhs_lane_s32(__p0, __p1, __p2): evaluates to
   * vqdmulhs_s32(__p0, <lane __p2 of __p1>), with the lane read through
   * vget_lane_s32.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vget_lane_s32; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhs_lane_s32(__p0_652, __p1_652, __p2_652) __extension__ ({ \
    int32_t __s0_652 = __p0_652; \
    int32x2_t __s1_652 = __p1_652; \
    vqdmulhs_s32(__s0_652, vget_lane_s32(__s1_652, __p2_652)); \
  })
  #else
  #define vqdmulhs_lane_s32(__p0_653, __p1_653, __p2_653) __extension__ ({ \
    int32_t __s0_653 = __p0_653; \
    int32x2_t __s1_653 = __p1_653; \
    int32x2_t __rev1_653 = __builtin_shufflevector(__s1_653, __s1_653, 1, 0); \
    vqdmulhs_s32(__s0_653, __noswap_vget_lane_s32(__rev1_653, __p2_653)); \
  })
  #endif
  56971 
  /* vqdmulhh_lane_s16(__p0, __p1, __p2): evaluates to
   * vqdmulhh_s16(__p0, <lane __p2 of __p1>), with the lane read through
   * vget_lane_s16.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vget_lane_s16; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhh_lane_s16(__p0_654, __p1_654, __p2_654) __extension__ ({ \
    int16_t __s0_654 = __p0_654; \
    int16x4_t __s1_654 = __p1_654; \
    vqdmulhh_s16(__s0_654, vget_lane_s16(__s1_654, __p2_654)); \
  })
  #else
  #define vqdmulhh_lane_s16(__p0_655, __p1_655, __p2_655) __extension__ ({ \
    int16_t __s0_655 = __p0_655; \
    int16x4_t __s1_655 = __p1_655; \
    int16x4_t __rev1_655 = __builtin_shufflevector(__s1_655, __s1_655, 3, 2, 1, 0); \
    vqdmulhh_s16(__s0_655, __noswap_vget_lane_s16(__rev1_655, __p2_655)); \
  })
  #endif
  56990 
  /* vqdmulhs_laneq_s32(__p0, __p1, __p2): evaluates to
   * vqdmulhs_s32(__p0, <lane __p2 of __p1>), with the lane read from the
   * int32x4_t vector through vgetq_lane_s32.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vgetq_lane_s32; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhs_laneq_s32(__p0_656, __p1_656, __p2_656) __extension__ ({ \
    int32_t __s0_656 = __p0_656; \
    int32x4_t __s1_656 = __p1_656; \
    vqdmulhs_s32(__s0_656, vgetq_lane_s32(__s1_656, __p2_656)); \
  })
  #else
  #define vqdmulhs_laneq_s32(__p0_657, __p1_657, __p2_657) __extension__ ({ \
    int32_t __s0_657 = __p0_657; \
    int32x4_t __s1_657 = __p1_657; \
    int32x4_t __rev1_657 = __builtin_shufflevector(__s1_657, __s1_657, 3, 2, 1, 0); \
    vqdmulhs_s32(__s0_657, __noswap_vgetq_lane_s32(__rev1_657, __p2_657)); \
  })
  #endif
  57009 
  /* vqdmulhh_laneq_s16(__p0, __p1, __p2): evaluates to
   * vqdmulhh_s16(__p0, <lane __p2 of __p1>), with the lane read from the
   * int16x8_t vector through vgetq_lane_s16.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vgetq_lane_s16; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhh_laneq_s16(__p0_658, __p1_658, __p2_658) __extension__ ({ \
    int16_t __s0_658 = __p0_658; \
    int16x8_t __s1_658 = __p1_658; \
    vqdmulhh_s16(__s0_658, vgetq_lane_s16(__s1_658, __p2_658)); \
  })
  #else
  #define vqdmulhh_laneq_s16(__p0_659, __p1_659, __p2_659) __extension__ ({ \
    int16_t __s0_659 = __p0_659; \
    int16x8_t __s1_659 = __p1_659; \
    int16x8_t __rev1_659 = __builtin_shufflevector(__s1_659, __s1_659, 7, 6, 5, 4, 3, 2, 1, 0); \
    vqdmulhh_s16(__s0_659, __noswap_vgetq_lane_s16(__rev1_659, __p2_659)); \
  })
  #endif
  57028 
  /* vqdmulhq_laneq_s32(__p0, __p1, __p2): evaluates to the int32x4_t result of
   * __builtin_neon_vqdmulhq_laneq_v on __p0 and __p1 (both int32x4_t) and lane
   * index __p2; the operands are passed as byte vectors together with the
   * type code 34.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __s0 = __p0; \
    int32x4_t __s1 = __p1; \
    (int32x4_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  })
  #else
  #define vqdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x4_t __s0 = __p0; \
    int32x4_t __s1 = __p1; \
    int32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    int32x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    int32x4_t __ret = (int32x4_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
    __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  57049 
  /* vqdmulhq_laneq_s16(__p0, __p1, __p2): evaluates to the int16x8_t result of
   * __builtin_neon_vqdmulhq_laneq_v on __p0 and __p1 (both int16x8_t) and lane
   * index __p2; the operands are passed as byte vectors together with the
   * type code 33.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __s0 = __p0; \
    int16x8_t __s1 = __p1; \
    (int16x8_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  })
  #else
  #define vqdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x8_t __s0 = __p0; \
    int16x8_t __s1 = __p1; \
    int16x8_t __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __ret = (int16x8_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
    __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  57070 
  /* vqdmulh_laneq_s32(__p0, __p1, __p2): evaluates to the int32x2_t result of
   * __builtin_neon_vqdmulh_laneq_v on __p0 (int32x2_t), __p1 (int32x4_t) and
   * lane index __p2; the operands are passed as byte vectors together with
   * the type code 2.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __s0 = __p0; \
    int32x4_t __s1 = __p1; \
    (int32x2_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 2); \
  })
  #else
  #define vqdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
    int32x2_t __s0 = __p0; \
    int32x4_t __s1 = __p1; \
    int32x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
    int32x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
    int32x2_t __ret = (int32x2_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 2); \
    __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
    __ret; \
  })
  #endif
  57091 
  /* vqdmulh_laneq_s16(__p0, __p1, __p2): evaluates to the int16x4_t result of
   * __builtin_neon_vqdmulh_laneq_v on __p0 (int16x4_t), __p1 (int16x8_t) and
   * lane index __p2; the operands are passed as byte vectors together with
   * the type code 1.
   * The big-endian variant reverses the lanes of both operands before the
   * call and reverses the lanes of the result afterwards. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s0 = __p0; \
    int16x8_t __s1 = __p1; \
    (int16x4_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 1); \
  })
  #else
  #define vqdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
    int16x4_t __s0 = __p0; \
    int16x8_t __s1 = __p1; \
    int16x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
    int16x8_t __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x4_t __ret = (int16x4_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 1); \
    __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
    __ret; \
  })
  #endif
  57112 
  57113 __ai __attribute__((target("neon"))) int64_t vqdmulls_s32(int32_t __p0, int32_t __p1) {
  57114   int64_t __ret;
  57115   __ret = (int64_t) __builtin_neon_vqdmulls_s32(__p0, __p1);
  57116   return __ret;
  57117 }
  57118 __ai __attribute__((target("neon"))) int32_t vqdmullh_s16(int16_t __p0, int16_t __p1) {
  57119   int32_t __ret;
  57120   __ret = (int32_t) __builtin_neon_vqdmullh_s16(__p0, __p1);
  57121   return __ret;
  57122 }
  57123 #ifdef __LITTLE_ENDIAN__
  57124 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_s32(int32x4_t __p0, int32x4_t __p1) {
  57125   int64x2_t __ret;
  57126   __ret = vqdmull_s32(vget_high_s32(__p0), vget_high_s32(__p1));
  57127   return __ret;
  57128 }
  57129 #else
  57130 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_s32(int32x4_t __p0, int32x4_t __p1) {
  57131   int64x2_t __ret;
  57132   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  57133   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  57134   __ret = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1));
  57135   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  57136   return __ret;
  57137 }
  57138 #endif
  57139 
  57140 #ifdef __LITTLE_ENDIAN__
  57141 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_s16(int16x8_t __p0, int16x8_t __p1) {
  57142   int32x4_t __ret;
  57143   __ret = vqdmull_s16(vget_high_s16(__p0), vget_high_s16(__p1));
  57144   return __ret;
  57145 }
  57146 #else
  57147 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_s16(int16x8_t __p0, int16x8_t __p1) {
  57148   int32x4_t __ret;
  57149   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  57150   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  57151   __ret = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1));
  57152   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  57153   return __ret;
  57154 }
  57155 #endif
  57156 
  /* vqdmull_high_lane_s32(__p0, __p1, __p2): forwards to vqdmull_s32 with the
   * high half of __p0 (vget_high_s32) and lane __p2 of __p1 broadcast through
   * splat_lane_s32.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_high_lane_s32(__p0_660, __p1_660, __p2_660) __extension__ ({ \
    int32x4_t __s0_660 = __p0_660; \
    int32x2_t __s1_660 = __p1_660; \
    vqdmull_s32(vget_high_s32(__s0_660), splat_lane_s32(__s1_660, __p2_660)); \
  })
  #else
  #define vqdmull_high_lane_s32(__p0_661, __p1_661, __p2_661) __extension__ ({ \
    int32x4_t __s0_661 = __p0_661; \
    int32x2_t __s1_661 = __p1_661; \
    int32x4_t __rev0_661 = __builtin_shufflevector(__s0_661, __s0_661, 3, 2, 1, 0); \
    int32x2_t __rev1_661 = __builtin_shufflevector(__s1_661, __s1_661, 1, 0); \
    int64x2_t __ret_661 = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0_661), __noswap_splat_lane_s32(__rev1_661, __p2_661)); \
    __ret_661 = __builtin_shufflevector(__ret_661, __ret_661, 1, 0); \
    __ret_661; \
  })
  #endif
  57177 
  /* vqdmull_high_lane_s16(__p0, __p1, __p2): forwards to vqdmull_s16 with the
   * high half of __p0 (vget_high_s16) and lane __p2 of __p1 broadcast through
   * splat_lane_s16.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_high_lane_s16(__p0_662, __p1_662, __p2_662) __extension__ ({ \
    int16x8_t __s0_662 = __p0_662; \
    int16x4_t __s1_662 = __p1_662; \
    vqdmull_s16(vget_high_s16(__s0_662), splat_lane_s16(__s1_662, __p2_662)); \
  })
  #else
  #define vqdmull_high_lane_s16(__p0_663, __p1_663, __p2_663) __extension__ ({ \
    int16x8_t __s0_663 = __p0_663; \
    int16x4_t __s1_663 = __p1_663; \
    int16x8_t __rev0_663 = __builtin_shufflevector(__s0_663, __s0_663, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x4_t __rev1_663 = __builtin_shufflevector(__s1_663, __s1_663, 3, 2, 1, 0); \
    int32x4_t __ret_663 = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0_663), __noswap_splat_lane_s16(__rev1_663, __p2_663)); \
    __ret_663 = __builtin_shufflevector(__ret_663, __ret_663, 3, 2, 1, 0); \
    __ret_663; \
  })
  #endif
  57198 
  /* vqdmull_high_laneq_s32(__p0, __p1, __p2): forwards to vqdmull_s32 with the
   * high half of __p0 (vget_high_s32) and lane __p2 of the int32x4_t vector
   * __p1 broadcast through splat_laneq_s32.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_high_laneq_s32(__p0_664, __p1_664, __p2_664) __extension__ ({ \
    int32x4_t __s0_664 = __p0_664; \
    int32x4_t __s1_664 = __p1_664; \
    vqdmull_s32(vget_high_s32(__s0_664), splat_laneq_s32(__s1_664, __p2_664)); \
  })
  #else
  #define vqdmull_high_laneq_s32(__p0_665, __p1_665, __p2_665) __extension__ ({ \
    int32x4_t __s0_665 = __p0_665; \
    int32x4_t __s1_665 = __p1_665; \
    int32x4_t __rev0_665 = __builtin_shufflevector(__s0_665, __s0_665, 3, 2, 1, 0); \
    int32x4_t __rev1_665 = __builtin_shufflevector(__s1_665, __s1_665, 3, 2, 1, 0); \
    int64x2_t __ret_665 = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0_665), __noswap_splat_laneq_s32(__rev1_665, __p2_665)); \
    __ret_665 = __builtin_shufflevector(__ret_665, __ret_665, 1, 0); \
    __ret_665; \
  })
  #endif
  57219 
  /* vqdmull_high_laneq_s16(__p0, __p1, __p2): forwards to vqdmull_s16 with the
   * high half of __p0 (vget_high_s16) and lane __p2 of the int16x8_t vector
   * __p1 broadcast through splat_laneq_s16.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_high_laneq_s16(__p0_666, __p1_666, __p2_666) __extension__ ({ \
    int16x8_t __s0_666 = __p0_666; \
    int16x8_t __s1_666 = __p1_666; \
    vqdmull_s16(vget_high_s16(__s0_666), splat_laneq_s16(__s1_666, __p2_666)); \
  })
  #else
  #define vqdmull_high_laneq_s16(__p0_667, __p1_667, __p2_667) __extension__ ({ \
    int16x8_t __s0_667 = __p0_667; \
    int16x8_t __s1_667 = __p1_667; \
    int16x8_t __rev0_667 = __builtin_shufflevector(__s0_667, __s0_667, 7, 6, 5, 4, 3, 2, 1, 0); \
    int16x8_t __rev1_667 = __builtin_shufflevector(__s1_667, __s1_667, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x4_t __ret_667 = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0_667), __noswap_splat_laneq_s16(__rev1_667, __p2_667)); \
    __ret_667 = __builtin_shufflevector(__ret_667, __ret_667, 3, 2, 1, 0); \
    __ret_667; \
  })
  #endif
  57240 
  57241 #ifdef __LITTLE_ENDIAN__
  57242 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_n_s32(int32x4_t __p0, int32_t __p1) {
  57243   int64x2_t __ret;
  57244   __ret = vqdmull_n_s32(vget_high_s32(__p0), __p1);
  57245   return __ret;
  57246 }
  57247 #else
  57248 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_n_s32(int32x4_t __p0, int32_t __p1) {
  57249   int64x2_t __ret;
  57250   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  57251   __ret = __noswap_vqdmull_n_s32(__noswap_vget_high_s32(__rev0), __p1);
  57252   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  57253   return __ret;
  57254 }
  57255 #endif
  57256 
  57257 #ifdef __LITTLE_ENDIAN__
  57258 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_n_s16(int16x8_t __p0, int16_t __p1) {
  57259   int32x4_t __ret;
  57260   __ret = vqdmull_n_s16(vget_high_s16(__p0), __p1);
  57261   return __ret;
  57262 }
  57263 #else
  57264 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_n_s16(int16x8_t __p0, int16_t __p1) {
  57265   int32x4_t __ret;
  57266   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  57267   __ret = __noswap_vqdmull_n_s16(__noswap_vget_high_s16(__rev0), __p1);
  57268   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  57269   return __ret;
  57270 }
  57271 #endif
  57272 
  /* vqdmulls_lane_s32(__p0, __p1, __p2): evaluates to
   * vqdmulls_s32(__p0, <lane __p2 of __p1>), with the lane read through
   * vget_lane_s32.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vget_lane_s32; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulls_lane_s32(__p0_668, __p1_668, __p2_668) __extension__ ({ \
    int32_t __s0_668 = __p0_668; \
    int32x2_t __s1_668 = __p1_668; \
    vqdmulls_s32(__s0_668, vget_lane_s32(__s1_668, __p2_668)); \
  })
  #else
  #define vqdmulls_lane_s32(__p0_669, __p1_669, __p2_669) __extension__ ({ \
    int32_t __s0_669 = __p0_669; \
    int32x2_t __s1_669 = __p1_669; \
    int32x2_t __rev1_669 = __builtin_shufflevector(__s1_669, __s1_669, 1, 0); \
    vqdmulls_s32(__s0_669, __noswap_vget_lane_s32(__rev1_669, __p2_669)); \
  })
  #endif
  57291 
  /* vqdmullh_lane_s16(__p0, __p1, __p2): evaluates to
   * vqdmullh_s16(__p0, <lane __p2 of __p1>), with the lane read through
   * vget_lane_s16.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vget_lane_s16; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmullh_lane_s16(__p0_670, __p1_670, __p2_670) __extension__ ({ \
    int16_t __s0_670 = __p0_670; \
    int16x4_t __s1_670 = __p1_670; \
    vqdmullh_s16(__s0_670, vget_lane_s16(__s1_670, __p2_670)); \
  })
  #else
  #define vqdmullh_lane_s16(__p0_671, __p1_671, __p2_671) __extension__ ({ \
    int16_t __s0_671 = __p0_671; \
    int16x4_t __s1_671 = __p1_671; \
    int16x4_t __rev1_671 = __builtin_shufflevector(__s1_671, __s1_671, 3, 2, 1, 0); \
    vqdmullh_s16(__s0_671, __noswap_vget_lane_s16(__rev1_671, __p2_671)); \
  })
  #endif
  57310 
  /* vqdmulls_laneq_s32(__p0, __p1, __p2): evaluates to
   * vqdmulls_s32(__p0, <lane __p2 of __p1>), with the lane read from the
   * int32x4_t vector through vgetq_lane_s32.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vgetq_lane_s32; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmulls_laneq_s32(__p0_672, __p1_672, __p2_672) __extension__ ({ \
    int32_t __s0_672 = __p0_672; \
    int32x4_t __s1_672 = __p1_672; \
    vqdmulls_s32(__s0_672, vgetq_lane_s32(__s1_672, __p2_672)); \
  })
  #else
  #define vqdmulls_laneq_s32(__p0_673, __p1_673, __p2_673) __extension__ ({ \
    int32_t __s0_673 = __p0_673; \
    int32x4_t __s1_673 = __p1_673; \
    int32x4_t __rev1_673 = __builtin_shufflevector(__s1_673, __s1_673, 3, 2, 1, 0); \
    vqdmulls_s32(__s0_673, __noswap_vgetq_lane_s32(__rev1_673, __p2_673)); \
  })
  #endif
  57329 
  /* vqdmullh_laneq_s16(__p0, __p1, __p2): evaluates to
   * vqdmullh_s16(__p0, <lane __p2 of __p1>), with the lane read from the
   * int16x8_t vector through vgetq_lane_s16.
   * The big-endian variant reverses the lanes of __p1 and reads the lane with
   * __noswap_vgetq_lane_s16; the result is a scalar and needs no fix-up.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmullh_laneq_s16(__p0_674, __p1_674, __p2_674) __extension__ ({ \
    int16_t __s0_674 = __p0_674; \
    int16x8_t __s1_674 = __p1_674; \
    vqdmullh_s16(__s0_674, vgetq_lane_s16(__s1_674, __p2_674)); \
  })
  #else
  #define vqdmullh_laneq_s16(__p0_675, __p1_675, __p2_675) __extension__ ({ \
    int16_t __s0_675 = __p0_675; \
    int16x8_t __s1_675 = __p1_675; \
    int16x8_t __rev1_675 = __builtin_shufflevector(__s1_675, __s1_675, 7, 6, 5, 4, 3, 2, 1, 0); \
    vqdmullh_s16(__s0_675, __noswap_vgetq_lane_s16(__rev1_675, __p2_675)); \
  })
  #endif
  57348 
  /* vqdmull_laneq_s32(__p0, __p1, __p2): forwards to vqdmull_s32 with __p0 and
   * lane __p2 of the int32x4_t vector __p1 broadcast through splat_laneq_s32.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_laneq_s32(__p0_676, __p1_676, __p2_676) __extension__ ({ \
    int32x2_t __s0_676 = __p0_676; \
    int32x4_t __s1_676 = __p1_676; \
    vqdmull_s32(__s0_676, splat_laneq_s32(__s1_676, __p2_676)); \
  })
  #else
  #define vqdmull_laneq_s32(__p0_677, __p1_677, __p2_677) __extension__ ({ \
    int32x2_t __s0_677 = __p0_677; \
    int32x4_t __s1_677 = __p1_677; \
    int32x2_t __rev0_677 = __builtin_shufflevector(__s0_677, __s0_677, 1, 0); \
    int32x4_t __rev1_677 = __builtin_shufflevector(__s1_677, __s1_677, 3, 2, 1, 0); \
    int64x2_t __ret_677 = __noswap_vqdmull_s32(__rev0_677, __noswap_splat_laneq_s32(__rev1_677, __p2_677)); \
    __ret_677 = __builtin_shufflevector(__ret_677, __ret_677, 1, 0); \
    __ret_677; \
  })
  #endif
  57369 
  /* vqdmull_laneq_s16(__p0, __p1, __p2): forwards to vqdmull_s16 with __p0 and
   * lane __p2 of the int16x8_t vector __p1 broadcast through splat_laneq_s16.
   * The big-endian variant reverses the lanes of both operands, calls the
   * __noswap_ helpers, and reverses the lanes of the result again.
   * The numeric suffixes on the locals are preserved so that nested macro
   * expansions cannot capture each other's temporaries. */
  #ifdef __LITTLE_ENDIAN__
  #define vqdmull_laneq_s16(__p0_678, __p1_678, __p2_678) __extension__ ({ \
    int16x4_t __s0_678 = __p0_678; \
    int16x8_t __s1_678 = __p1_678; \
    vqdmull_s16(__s0_678, splat_laneq_s16(__s1_678, __p2_678)); \
  })
  #else
  #define vqdmull_laneq_s16(__p0_679, __p1_679, __p2_679) __extension__ ({ \
    int16x4_t __s0_679 = __p0_679; \
    int16x8_t __s1_679 = __p1_679; \
    int16x4_t __rev0_679 = __builtin_shufflevector(__s0_679, __s0_679, 3, 2, 1, 0); \
    int16x8_t __rev1_679 = __builtin_shufflevector(__s1_679, __s1_679, 7, 6, 5, 4, 3, 2, 1, 0); \
    int32x4_t __ret_679 = __noswap_vqdmull_s16(__rev0_679, __noswap_splat_laneq_s16(__rev1_679, __p2_679)); \
    __ret_679 = __builtin_shufflevector(__ret_679, __ret_679, 3, 2, 1, 0); \
    __ret_679; \
  })
  #endif
  57390 
  57391 __ai __attribute__((target("neon"))) int16_t vqmovns_s32(int32_t __p0) {
  57392   int16_t __ret;
  57393   __ret = (int16_t) __builtin_neon_vqmovns_s32(__p0);
  57394   return __ret;
  57395 }
  57396 __ai __attribute__((target("neon"))) int32_t vqmovnd_s64(int64_t __p0) {
  57397   int32_t __ret;
  57398   __ret = (int32_t) __builtin_neon_vqmovnd_s64(__p0);
  57399   return __ret;
  57400 }
  57401 __ai __attribute__((target("neon"))) int8_t vqmovnh_s16(int16_t __p0) {
  57402   int8_t __ret;
  57403   __ret = (int8_t) __builtin_neon_vqmovnh_s16(__p0);
  57404   return __ret;
  57405 }
  57406 __ai __attribute__((target("neon"))) uint16_t vqmovns_u32(uint32_t __p0) {
  57407   uint16_t __ret;
  57408   __ret = (uint16_t) __builtin_neon_vqmovns_u32(__p0);
  57409   return __ret;
  57410 }
  57411 __ai __attribute__((target("neon"))) uint32_t vqmovnd_u64(uint64_t __p0) {
  57412   uint32_t __ret;
  57413   __ret = (uint32_t) __builtin_neon_vqmovnd_u64(__p0);
  57414   return __ret;
  57415 }
  57416 __ai __attribute__((target("neon"))) uint8_t vqmovnh_u16(uint16_t __p0) {
  57417   uint8_t __ret;
  57418   __ret = (uint8_t) __builtin_neon_vqmovnh_u16(__p0);
  57419   return __ret;
  57420 }
  57421 #ifdef __LITTLE_ENDIAN__
  57422 __ai __attribute__((target("neon"))) uint16x8_t vqmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) {
  57423   uint16x8_t __ret;
  57424   __ret = vcombine_u16(__p0, vqmovn_u32(__p1));
  57425   return __ret;
  57426 }
  57427 #else
  57428 __ai __attribute__((target("neon"))) uint16x8_t vqmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) {
  57429   uint16x8_t __ret;
  57430   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  57431   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  57432   __ret = __noswap_vcombine_u16(__rev0, __noswap_vqmovn_u32(__rev1));
  57433   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  57434   return __ret;
  57435 }
  57436 #endif
  57437 
  57438 #ifdef __LITTLE_ENDIAN__
  57439 __ai __attribute__((target("neon"))) uint32x4_t vqmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) {
  57440   uint32x4_t __ret;
  57441   __ret = vcombine_u32(__p0, vqmovn_u64(__p1));
  57442   return __ret;
  57443 }
  57444 #else
  57445 __ai __attribute__((target("neon"))) uint32x4_t vqmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) {
  57446   uint32x4_t __ret;
  57447   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  57448   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  57449   __ret = __noswap_vcombine_u32(__rev0, __noswap_vqmovn_u64(__rev1));
  57450   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  57451   return __ret;
  57452 }
  57453 #endif
  57454 
  57455 #ifdef __LITTLE_ENDIAN__
  57456 __ai __attribute__((target("neon"))) uint8x16_t vqmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) {
  57457   uint8x16_t __ret;
  57458   __ret = vcombine_u8(__p0, vqmovn_u16(__p1));
  57459   return __ret;
  57460 }
  57461 #else
  57462 __ai __attribute__((target("neon"))) uint8x16_t vqmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) {
  57463   uint8x16_t __ret;
  57464   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  57465   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  57466   __ret = __noswap_vcombine_u8(__rev0, __noswap_vqmovn_u16(__rev1));
  57467   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  57468   return __ret;
  57469 }
  57470 #endif
  57471 
  57472 #ifdef __LITTLE_ENDIAN__
  57473 __ai __attribute__((target("neon"))) int16x8_t vqmovn_high_s32(int16x4_t __p0, int32x4_t __p1) {
  57474   int16x8_t __ret;
  57475   __ret = vcombine_s16(__p0, vqmovn_s32(__p1));
  57476   return __ret;
  57477 }
  57478 #else
  57479 __ai __attribute__((target("neon"))) int16x8_t vqmovn_high_s32(int16x4_t __p0, int32x4_t __p1) {
  57480   int16x8_t __ret;
  57481   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  57482   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  57483   __ret = __noswap_vcombine_s16(__rev0, __noswap_vqmovn_s32(__rev1));
  57484   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  57485   return __ret;
  57486 }
  57487 #endif
  57488 
  57489 #ifdef __LITTLE_ENDIAN__
  57490 __ai __attribute__((target("neon"))) int32x4_t vqmovn_high_s64(int32x2_t __p0, int64x2_t __p1) {
  57491   int32x4_t __ret;
  57492   __ret = vcombine_s32(__p0, vqmovn_s64(__p1));
  57493   return __ret;
  57494 }
  57495 #else
  57496 __ai __attribute__((target("neon"))) int32x4_t vqmovn_high_s64(int32x2_t __p0, int64x2_t __p1) {
  57497   int32x4_t __ret;
  57498   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  57499   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  57500   __ret = __noswap_vcombine_s32(__rev0, __noswap_vqmovn_s64(__rev1));
  57501   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  57502   return __ret;
  57503 }
  57504 #endif
  57505 
  57506 #ifdef __LITTLE_ENDIAN__
  57507 __ai __attribute__((target("neon"))) int8x16_t vqmovn_high_s16(int8x8_t __p0, int16x8_t __p1) {
  57508   int8x16_t __ret;
  57509   __ret = vcombine_s8(__p0, vqmovn_s16(__p1));
  57510   return __ret;
  57511 }
  57512 #else
  57513 __ai __attribute__((target("neon"))) int8x16_t vqmovn_high_s16(int8x8_t __p0, int16x8_t __p1) {
  57514   int8x16_t __ret;
  57515   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  57516   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  57517   __ret = __noswap_vcombine_s8(__rev0, __noswap_vqmovn_s16(__rev1));
  57518   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  57519   return __ret;
  57520 }
  57521 #endif
  57522 
  57523 __ai __attribute__((target("neon"))) uint16_t vqmovuns_s32(int32_t __p0) {
  57524   uint16_t __ret;
  57525   __ret = (uint16_t) __builtin_neon_vqmovuns_s32(__p0);
  57526   return __ret;
  57527 }
  57528 __ai __attribute__((target("neon"))) uint32_t vqmovund_s64(int64_t __p0) {
  57529   uint32_t __ret;
  57530   __ret = (uint32_t) __builtin_neon_vqmovund_s64(__p0);
  57531   return __ret;
  57532 }
  57533 __ai __attribute__((target("neon"))) uint8_t vqmovunh_s16(int16_t __p0) {
  57534   uint8_t __ret;
  57535   __ret = (uint8_t) __builtin_neon_vqmovunh_s16(__p0);
  57536   return __ret;
  57537 }
  57538 #ifdef __LITTLE_ENDIAN__
  57539 __ai __attribute__((target("neon"))) uint16x8_t vqmovun_high_s32(uint16x4_t __p0, int32x4_t __p1) {
  57540   uint16x8_t __ret;
  57541   __ret = vcombine_u16((uint16x4_t)(__p0), vqmovun_s32(__p1));
  57542   return __ret;
  57543 }
  57544 #else
  57545 __ai __attribute__((target("neon"))) uint16x8_t vqmovun_high_s32(uint16x4_t __p0, int32x4_t __p1) {
  57546   uint16x8_t __ret;
  57547   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  57548   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  57549   __ret = __noswap_vcombine_u16((uint16x4_t)(__rev0), __noswap_vqmovun_s32(__rev1));
  57550   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  57551   return __ret;
  57552 }
  57553 #endif
  57554 
  57555 #ifdef __LITTLE_ENDIAN__
  57556 __ai __attribute__((target("neon"))) uint32x4_t vqmovun_high_s64(uint32x2_t __p0, int64x2_t __p1) {
  57557   uint32x4_t __ret;
  57558   __ret = vcombine_u32((uint32x2_t)(__p0), vqmovun_s64(__p1));
  57559   return __ret;
  57560 }
  57561 #else
  57562 __ai __attribute__((target("neon"))) uint32x4_t vqmovun_high_s64(uint32x2_t __p0, int64x2_t __p1) {
  57563   uint32x4_t __ret;
  57564   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  57565   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  57566   __ret = __noswap_vcombine_u32((uint32x2_t)(__rev0), __noswap_vqmovun_s64(__rev1));
  57567   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  57568   return __ret;
  57569 }
  57570 #endif
  57571 
  57572 #ifdef __LITTLE_ENDIAN__
  57573 __ai __attribute__((target("neon"))) uint8x16_t vqmovun_high_s16(uint8x8_t __p0, int16x8_t __p1) {
  57574   uint8x16_t __ret;
  57575   __ret = vcombine_u8((uint8x8_t)(__p0), vqmovun_s16(__p1));
  57576   return __ret;
  57577 }
  57578 #else
  57579 __ai __attribute__((target("neon"))) uint8x16_t vqmovun_high_s16(uint8x8_t __p0, int16x8_t __p1) {
  57580   uint8x16_t __ret;
  57581   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  57582   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  57583   __ret = __noswap_vcombine_u8((uint8x8_t)(__rev0), __noswap_vqmovun_s16(__rev1));
  57584   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  57585   return __ret;
  57586 }
  57587 #endif
  57588 
  57589 #ifdef __LITTLE_ENDIAN__
  57590 __ai __attribute__((target("neon"))) int64x2_t vqnegq_s64(int64x2_t __p0) {
  57591   int64x2_t __ret;
  57592   __ret = (int64x2_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 35);
  57593   return __ret;
  57594 }
  57595 #else
  57596 __ai __attribute__((target("neon"))) int64x2_t vqnegq_s64(int64x2_t __p0) {
  57597   int64x2_t __ret;
  57598   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  57599   __ret = (int64x2_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 35);
  57600   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  57601   return __ret;
  57602 }
  57603 #endif
  57604 
  57605 __ai __attribute__((target("neon"))) int64x1_t vqneg_s64(int64x1_t __p0) {
  57606   int64x1_t __ret;
  57607   __ret = (int64x1_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 3);
  57608   return __ret;
  57609 }
  57610 __ai __attribute__((target("neon"))) int8_t vqnegb_s8(int8_t __p0) {
  57611   int8_t __ret;
  57612   __ret = (int8_t) __builtin_neon_vqnegb_s8(__p0);
  57613   return __ret;
  57614 }
  57615 __ai __attribute__((target("neon"))) int32_t vqnegs_s32(int32_t __p0) {
  57616   int32_t __ret;
  57617   __ret = (int32_t) __builtin_neon_vqnegs_s32(__p0);
  57618   return __ret;
  57619 }
  57620 __ai __attribute__((target("neon"))) int64_t vqnegd_s64(int64_t __p0) {
  57621   int64_t __ret;
  57622   __ret = (int64_t) __builtin_neon_vqnegd_s64(__p0);
  57623   return __ret;
  57624 }
  57625 __ai __attribute__((target("neon"))) int16_t vqnegh_s16(int16_t __p0) {
  57626   int16_t __ret;
  57627   __ret = (int16_t) __builtin_neon_vqnegh_s16(__p0);
  57628   return __ret;
  57629 }
  57630 __ai __attribute__((target("neon"))) int32_t vqrdmulhs_s32(int32_t __p0, int32_t __p1) {
  57631   int32_t __ret;
  57632   __ret = (int32_t) __builtin_neon_vqrdmulhs_s32(__p0, __p1);
  57633   return __ret;
  57634 }
  57635 __ai __attribute__((target("neon"))) int16_t vqrdmulhh_s16(int16_t __p0, int16_t __p1) {
  57636   int16_t __ret;
  57637   __ret = (int16_t) __builtin_neon_vqrdmulhh_s16(__p0, __p1);
  57638   return __ret;
  57639 }
  /* vqrdmulhq_lane_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int32x4_t. __p0 is copied into an int32x4_t, __p1 into an int32x2_t, and
   * __p2 is forwarded untouched to __builtin_neon_vqrdmulhq_lane_v together
   * with the trailing constant 2.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57640 #ifdef __LITTLE_ENDIAN__
  57641 #define vqrdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  57642   int32x4_t __ret; \
  57643   int32x4_t __s0 = __p0; \
  57644   int32x2_t __s1 = __p1; \
  57645   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 2); \
  57646   __ret; \
  57647 })
  57648 #else
  57649 #define vqrdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  57650   int32x4_t __ret; \
  57651   int32x4_t __s0 = __p0; \
  57652   int32x2_t __s1 = __p1; \
  57653   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  57654   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  57655   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  57656   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  57657   __ret; \
  57658 })
  57659 #endif
  57660 
  /* vqrdmulhq_lane_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int16x8_t. __p0 is copied into an int16x8_t, __p1 into an int16x4_t, and
   * __p2 is forwarded untouched to __builtin_neon_vqrdmulhq_lane_v together
   * with the trailing constant 1.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57661 #ifdef __LITTLE_ENDIAN__
  57662 #define vqrdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  57663   int16x8_t __ret; \
  57664   int16x8_t __s0 = __p0; \
  57665   int16x4_t __s1 = __p1; \
  57666   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 1); \
  57667   __ret; \
  57668 })
  57669 #else
  57670 #define vqrdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  57671   int16x8_t __ret; \
  57672   int16x8_t __s0 = __p0; \
  57673   int16x4_t __s1 = __p1; \
  57674   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  57675   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  57676   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  57677   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  57678   __ret; \
  57679 })
  57680 #endif
  57681 
  /* vqrdmulh_lane_s32(__p0, __p1, __p2): statement-expression macro yielding an
   * int32x2_t. __p0 and __p1 are each copied into an int32x2_t, and __p2 is
   * forwarded untouched to __builtin_neon_vqrdmulh_lane_v together with the
   * trailing constant 2.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57682 #ifdef __LITTLE_ENDIAN__
  57683 #define vqrdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  57684   int32x2_t __ret; \
  57685   int32x2_t __s0 = __p0; \
  57686   int32x2_t __s1 = __p1; \
  57687   __ret = (int32x2_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \
  57688   __ret; \
  57689 })
  57690 #else
  57691 #define vqrdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  57692   int32x2_t __ret; \
  57693   int32x2_t __s0 = __p0; \
  57694   int32x2_t __s1 = __p1; \
  57695   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  57696   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  57697   __ret = (int32x2_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \
  57698   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  57699   __ret; \
  57700 })
  57701 #endif
  57702 
  /* vqrdmulh_lane_s16(__p0, __p1, __p2): statement-expression macro yielding an
   * int16x4_t. __p0 and __p1 are each copied into an int16x4_t, and __p2 is
   * forwarded untouched to __builtin_neon_vqrdmulh_lane_v together with the
   * trailing constant 1.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57703 #ifdef __LITTLE_ENDIAN__
  57704 #define vqrdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  57705   int16x4_t __ret; \
  57706   int16x4_t __s0 = __p0; \
  57707   int16x4_t __s1 = __p1; \
  57708   __ret = (int16x4_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \
  57709   __ret; \
  57710 })
  57711 #else
  57712 #define vqrdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  57713   int16x4_t __ret; \
  57714   int16x4_t __s0 = __p0; \
  57715   int16x4_t __s1 = __p1; \
  57716   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  57717   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  57718   __ret = (int16x4_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \
  57719   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  57720   __ret; \
  57721 })
  57722 #endif
  57723 
  /* vqrdmulhs_lane_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int32_t. __p0 is copied into an int32_t and __p1 into an int32x2_t; the
   * result is vqrdmulhs_s32(__s0, <lane __p2 of __s1>).
   * Little-endian: the lane is read with vget_lane_s32.
   * Big-endian: __s1 is lane-reversed first and the lane is read with
   * __noswap_vget_lane_s32; the scalar result needs no reversal. */
  57724 #ifdef __LITTLE_ENDIAN__
  57725 #define vqrdmulhs_lane_s32(__p0_680, __p1_680, __p2_680) __extension__ ({ \
  57726   int32_t __ret_680; \
  57727   int32_t __s0_680 = __p0_680; \
  57728   int32x2_t __s1_680 = __p1_680; \
  57729   __ret_680 = vqrdmulhs_s32(__s0_680, vget_lane_s32(__s1_680, __p2_680)); \
  57730   __ret_680; \
  57731 })
  57732 #else
  57733 #define vqrdmulhs_lane_s32(__p0_681, __p1_681, __p2_681) __extension__ ({ \
  57734   int32_t __ret_681; \
  57735   int32_t __s0_681 = __p0_681; \
  57736   int32x2_t __s1_681 = __p1_681; \
  57737   int32x2_t __rev1_681;  __rev1_681 = __builtin_shufflevector(__s1_681, __s1_681, 1, 0); \
  57738   __ret_681 = vqrdmulhs_s32(__s0_681, __noswap_vget_lane_s32(__rev1_681, __p2_681)); \
  57739   __ret_681; \
  57740 })
  57741 #endif
  57742 
  /* vqrdmulhh_lane_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int16_t. __p0 is copied into an int16_t and __p1 into an int16x4_t; the
   * result is vqrdmulhh_s16(__s0, <lane __p2 of __s1>).
   * Little-endian: the lane is read with vget_lane_s16.
   * Big-endian: __s1 is lane-reversed first and the lane is read with
   * __noswap_vget_lane_s16; the scalar result needs no reversal. */
  57743 #ifdef __LITTLE_ENDIAN__
  57744 #define vqrdmulhh_lane_s16(__p0_682, __p1_682, __p2_682) __extension__ ({ \
  57745   int16_t __ret_682; \
  57746   int16_t __s0_682 = __p0_682; \
  57747   int16x4_t __s1_682 = __p1_682; \
  57748   __ret_682 = vqrdmulhh_s16(__s0_682, vget_lane_s16(__s1_682, __p2_682)); \
  57749   __ret_682; \
  57750 })
  57751 #else
  57752 #define vqrdmulhh_lane_s16(__p0_683, __p1_683, __p2_683) __extension__ ({ \
  57753   int16_t __ret_683; \
  57754   int16_t __s0_683 = __p0_683; \
  57755   int16x4_t __s1_683 = __p1_683; \
  57756   int16x4_t __rev1_683;  __rev1_683 = __builtin_shufflevector(__s1_683, __s1_683, 3, 2, 1, 0); \
  57757   __ret_683 = vqrdmulhh_s16(__s0_683, __noswap_vget_lane_s16(__rev1_683, __p2_683)); \
  57758   __ret_683; \
  57759 })
  57760 #endif
  57761 
  /* vqrdmulhs_laneq_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int32_t. __p0 is copied into an int32_t and __p1 into an int32x4_t; the
   * result is vqrdmulhs_s32(__s0, <lane __p2 of __s1>).
   * Little-endian: the lane is read with vgetq_lane_s32.
   * Big-endian: __s1 is lane-reversed first and the lane is read with
   * __noswap_vgetq_lane_s32; the scalar result needs no reversal. */
  57762 #ifdef __LITTLE_ENDIAN__
  57763 #define vqrdmulhs_laneq_s32(__p0_684, __p1_684, __p2_684) __extension__ ({ \
  57764   int32_t __ret_684; \
  57765   int32_t __s0_684 = __p0_684; \
  57766   int32x4_t __s1_684 = __p1_684; \
  57767   __ret_684 = vqrdmulhs_s32(__s0_684, vgetq_lane_s32(__s1_684, __p2_684)); \
  57768   __ret_684; \
  57769 })
  57770 #else
  57771 #define vqrdmulhs_laneq_s32(__p0_685, __p1_685, __p2_685) __extension__ ({ \
  57772   int32_t __ret_685; \
  57773   int32_t __s0_685 = __p0_685; \
  57774   int32x4_t __s1_685 = __p1_685; \
  57775   int32x4_t __rev1_685;  __rev1_685 = __builtin_shufflevector(__s1_685, __s1_685, 3, 2, 1, 0); \
  57776   __ret_685 = vqrdmulhs_s32(__s0_685, __noswap_vgetq_lane_s32(__rev1_685, __p2_685)); \
  57777   __ret_685; \
  57778 })
  57779 #endif
  57780 
  /* vqrdmulhh_laneq_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int16_t. __p0 is copied into an int16_t and __p1 into an int16x8_t; the
   * result is vqrdmulhh_s16(__s0, <lane __p2 of __s1>).
   * Little-endian: the lane is read with vgetq_lane_s16.
   * Big-endian: __s1 is lane-reversed first and the lane is read with
   * __noswap_vgetq_lane_s16; the scalar result needs no reversal. */
  57781 #ifdef __LITTLE_ENDIAN__
  57782 #define vqrdmulhh_laneq_s16(__p0_686, __p1_686, __p2_686) __extension__ ({ \
  57783   int16_t __ret_686; \
  57784   int16_t __s0_686 = __p0_686; \
  57785   int16x8_t __s1_686 = __p1_686; \
  57786   __ret_686 = vqrdmulhh_s16(__s0_686, vgetq_lane_s16(__s1_686, __p2_686)); \
  57787   __ret_686; \
  57788 })
  57789 #else
  57790 #define vqrdmulhh_laneq_s16(__p0_687, __p1_687, __p2_687) __extension__ ({ \
  57791   int16_t __ret_687; \
  57792   int16_t __s0_687 = __p0_687; \
  57793   int16x8_t __s1_687 = __p1_687; \
  57794   int16x8_t __rev1_687;  __rev1_687 = __builtin_shufflevector(__s1_687, __s1_687, 7, 6, 5, 4, 3, 2, 1, 0); \
  57795   __ret_687 = vqrdmulhh_s16(__s0_687, __noswap_vgetq_lane_s16(__rev1_687, __p2_687)); \
  57796   __ret_687; \
  57797 })
  57798 #endif
  57799 
  /* vqrdmulhq_laneq_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int32x4_t. __p0 and __p1 are each copied into an int32x4_t, and __p2 is
   * forwarded untouched to __builtin_neon_vqrdmulhq_laneq_v together with the
   * trailing constant 34.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57800 #ifdef __LITTLE_ENDIAN__
  57801 #define vqrdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
  57802   int32x4_t __ret; \
  57803   int32x4_t __s0 = __p0; \
  57804   int32x4_t __s1 = __p1; \
  57805   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \
  57806   __ret; \
  57807 })
  57808 #else
  57809 #define vqrdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
  57810   int32x4_t __ret; \
  57811   int32x4_t __s0 = __p0; \
  57812   int32x4_t __s1 = __p1; \
  57813   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  57814   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  57815   __ret = (int32x4_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \
  57816   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  57817   __ret; \
  57818 })
  57819 #endif
  57820 
  /* vqrdmulhq_laneq_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int16x8_t. __p0 and __p1 are each copied into an int16x8_t, and __p2 is
   * forwarded untouched to __builtin_neon_vqrdmulhq_laneq_v together with the
   * trailing constant 33.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57821 #ifdef __LITTLE_ENDIAN__
  57822 #define vqrdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  57823   int16x8_t __ret; \
  57824   int16x8_t __s0 = __p0; \
  57825   int16x8_t __s1 = __p1; \
  57826   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \
  57827   __ret; \
  57828 })
  57829 #else
  57830 #define vqrdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  57831   int16x8_t __ret; \
  57832   int16x8_t __s0 = __p0; \
  57833   int16x8_t __s1 = __p1; \
  57834   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  57835   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  57836   __ret = (int16x8_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \
  57837   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  57838   __ret; \
  57839 })
  57840 #endif
  57841 
  /* vqrdmulh_laneq_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int32x2_t. __p0 is copied into an int32x2_t, __p1 into an int32x4_t, and
   * __p2 is forwarded untouched to __builtin_neon_vqrdmulh_laneq_v together
   * with the trailing constant 2.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57842 #ifdef __LITTLE_ENDIAN__
  57843 #define vqrdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
  57844   int32x2_t __ret; \
  57845   int32x2_t __s0 = __p0; \
  57846   int32x4_t __s1 = __p1; \
  57847   __ret = (int32x2_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 2); \
  57848   __ret; \
  57849 })
  57850 #else
  57851 #define vqrdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \
  57852   int32x2_t __ret; \
  57853   int32x2_t __s0 = __p0; \
  57854   int32x4_t __s1 = __p1; \
  57855   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  57856   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  57857   __ret = (int32x2_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 2); \
  57858   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  57859   __ret; \
  57860 })
  57861 #endif
  57862 
  /* vqrdmulh_laneq_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int16x4_t. __p0 is copied into an int16x4_t, __p1 into an int16x8_t, and
   * __p2 is forwarded untouched to __builtin_neon_vqrdmulh_laneq_v together
   * with the trailing constant 1.
   * Big-endian: both vectors are lane-reversed before the builtin and the
   * result lanes are reversed afterwards.
   * The locals (__ret, __s0, __s1, __rev0, __rev1) carry no unique suffix. */
  57863 #ifdef __LITTLE_ENDIAN__
  57864 #define vqrdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  57865   int16x4_t __ret; \
  57866   int16x4_t __s0 = __p0; \
  57867   int16x8_t __s1 = __p1; \
  57868   __ret = (int16x4_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 1); \
  57869   __ret; \
  57870 })
  57871 #else
  57872 #define vqrdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \
  57873   int16x4_t __ret; \
  57874   int16x4_t __s0 = __p0; \
  57875   int16x8_t __s1 = __p1; \
  57876   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  57877   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  57878   __ret = (int16x4_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 1); \
  57879   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  57880   __ret; \
  57881 })
  57882 #endif
  57883 
  57884 __ai __attribute__((target("neon"))) uint8_t vqrshlb_u8(uint8_t __p0, int8_t __p1) {
  57885   uint8_t __ret;
  57886   __ret = (uint8_t) __builtin_neon_vqrshlb_u8(__p0, __p1);
  57887   return __ret;
  57888 }
  57889 __ai __attribute__((target("neon"))) uint32_t vqrshls_u32(uint32_t __p0, int32_t __p1) {
  57890   uint32_t __ret;
  57891   __ret = (uint32_t) __builtin_neon_vqrshls_u32(__p0, __p1);
  57892   return __ret;
  57893 }
  57894 __ai __attribute__((target("neon"))) uint64_t vqrshld_u64(uint64_t __p0, int64_t __p1) {
  57895   uint64_t __ret;
  57896   __ret = (uint64_t) __builtin_neon_vqrshld_u64(__p0, __p1);
  57897   return __ret;
  57898 }
  57899 __ai __attribute__((target("neon"))) uint16_t vqrshlh_u16(uint16_t __p0, int16_t __p1) {
  57900   uint16_t __ret;
  57901   __ret = (uint16_t) __builtin_neon_vqrshlh_u16(__p0, __p1);
  57902   return __ret;
  57903 }
  57904 __ai __attribute__((target("neon"))) int8_t vqrshlb_s8(int8_t __p0, int8_t __p1) {
  57905   int8_t __ret;
  57906   __ret = (int8_t) __builtin_neon_vqrshlb_s8(__p0, __p1);
  57907   return __ret;
  57908 }
  57909 __ai __attribute__((target("neon"))) int32_t vqrshls_s32(int32_t __p0, int32_t __p1) {
  57910   int32_t __ret;
  57911   __ret = (int32_t) __builtin_neon_vqrshls_s32(__p0, __p1);
  57912   return __ret;
  57913 }
  57914 __ai __attribute__((target("neon"))) int64_t vqrshld_s64(int64_t __p0, int64_t __p1) {
  57915   int64_t __ret;
  57916   __ret = (int64_t) __builtin_neon_vqrshld_s64(__p0, __p1);
  57917   return __ret;
  57918 }
  57919 __ai __attribute__((target("neon"))) int16_t vqrshlh_s16(int16_t __p0, int16_t __p1) {
  57920   int16_t __ret;
  57921   __ret = (int16_t) __builtin_neon_vqrshlh_s16(__p0, __p1);
  57922   return __ret;
  57923 }
  /* vqrshrn_high_n_u32(__p0, __p1, __p2): statement-expression macro yielding a
   * uint16x8_t. __p0 is copied into a uint16x4_t and __p1 into a uint32x4_t;
   * the result is vcombine_u16(__s0, vqrshrn_n_u32(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  57924 #ifdef __LITTLE_ENDIAN__
  57925 #define vqrshrn_high_n_u32(__p0_688, __p1_688, __p2_688) __extension__ ({ \
  57926   uint16x8_t __ret_688; \
  57927   uint16x4_t __s0_688 = __p0_688; \
  57928   uint32x4_t __s1_688 = __p1_688; \
  57929   __ret_688 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_688), (uint16x4_t)(vqrshrn_n_u32(__s1_688, __p2_688)))); \
  57930   __ret_688; \
  57931 })
  57932 #else
  57933 #define vqrshrn_high_n_u32(__p0_689, __p1_689, __p2_689) __extension__ ({ \
  57934   uint16x8_t __ret_689; \
  57935   uint16x4_t __s0_689 = __p0_689; \
  57936   uint32x4_t __s1_689 = __p1_689; \
  57937   uint16x4_t __rev0_689;  __rev0_689 = __builtin_shufflevector(__s0_689, __s0_689, 3, 2, 1, 0); \
  57938   uint32x4_t __rev1_689;  __rev1_689 = __builtin_shufflevector(__s1_689, __s1_689, 3, 2, 1, 0); \
  57939   __ret_689 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_689), (uint16x4_t)(__noswap_vqrshrn_n_u32(__rev1_689, __p2_689)))); \
  57940   __ret_689 = __builtin_shufflevector(__ret_689, __ret_689, 7, 6, 5, 4, 3, 2, 1, 0); \
  57941   __ret_689; \
  57942 })
  57943 #endif
  57944 
  /* vqrshrn_high_n_u64(__p0, __p1, __p2): statement-expression macro yielding a
   * uint32x4_t. __p0 is copied into a uint32x2_t and __p1 into a uint64x2_t;
   * the result is vcombine_u32(__s0, vqrshrn_n_u64(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  57945 #ifdef __LITTLE_ENDIAN__
  57946 #define vqrshrn_high_n_u64(__p0_690, __p1_690, __p2_690) __extension__ ({ \
  57947   uint32x4_t __ret_690; \
  57948   uint32x2_t __s0_690 = __p0_690; \
  57949   uint64x2_t __s1_690 = __p1_690; \
  57950   __ret_690 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_690), (uint32x2_t)(vqrshrn_n_u64(__s1_690, __p2_690)))); \
  57951   __ret_690; \
  57952 })
  57953 #else
  57954 #define vqrshrn_high_n_u64(__p0_691, __p1_691, __p2_691) __extension__ ({ \
  57955   uint32x4_t __ret_691; \
  57956   uint32x2_t __s0_691 = __p0_691; \
  57957   uint64x2_t __s1_691 = __p1_691; \
  57958   uint32x2_t __rev0_691;  __rev0_691 = __builtin_shufflevector(__s0_691, __s0_691, 1, 0); \
  57959   uint64x2_t __rev1_691;  __rev1_691 = __builtin_shufflevector(__s1_691, __s1_691, 1, 0); \
  57960   __ret_691 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_691), (uint32x2_t)(__noswap_vqrshrn_n_u64(__rev1_691, __p2_691)))); \
  57961   __ret_691 = __builtin_shufflevector(__ret_691, __ret_691, 3, 2, 1, 0); \
  57962   __ret_691; \
  57963 })
  57964 #endif
  57965 
  /* vqrshrn_high_n_u16(__p0, __p1, __p2): statement-expression macro yielding a
   * uint8x16_t. __p0 is copied into a uint8x8_t and __p1 into a uint16x8_t;
   * the result is vcombine_u8(__s0, vqrshrn_n_u16(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  57966 #ifdef __LITTLE_ENDIAN__
  57967 #define vqrshrn_high_n_u16(__p0_692, __p1_692, __p2_692) __extension__ ({ \
  57968   uint8x16_t __ret_692; \
  57969   uint8x8_t __s0_692 = __p0_692; \
  57970   uint16x8_t __s1_692 = __p1_692; \
  57971   __ret_692 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_692), (uint8x8_t)(vqrshrn_n_u16(__s1_692, __p2_692)))); \
  57972   __ret_692; \
  57973 })
  57974 #else
  57975 #define vqrshrn_high_n_u16(__p0_693, __p1_693, __p2_693) __extension__ ({ \
  57976   uint8x16_t __ret_693; \
  57977   uint8x8_t __s0_693 = __p0_693; \
  57978   uint16x8_t __s1_693 = __p1_693; \
  57979   uint8x8_t __rev0_693;  __rev0_693 = __builtin_shufflevector(__s0_693, __s0_693, 7, 6, 5, 4, 3, 2, 1, 0); \
  57980   uint16x8_t __rev1_693;  __rev1_693 = __builtin_shufflevector(__s1_693, __s1_693, 7, 6, 5, 4, 3, 2, 1, 0); \
  57981   __ret_693 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_693), (uint8x8_t)(__noswap_vqrshrn_n_u16(__rev1_693, __p2_693)))); \
  57982   __ret_693 = __builtin_shufflevector(__ret_693, __ret_693, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  57983   __ret_693; \
  57984 })
  57985 #endif
  57986 
  /* vqrshrn_high_n_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int16x8_t. __p0 is copied into an int16x4_t and __p1 into an int32x4_t;
   * the result is vcombine_s16(__s0, vqrshrn_n_s32(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  57987 #ifdef __LITTLE_ENDIAN__
  57988 #define vqrshrn_high_n_s32(__p0_694, __p1_694, __p2_694) __extension__ ({ \
  57989   int16x8_t __ret_694; \
  57990   int16x4_t __s0_694 = __p0_694; \
  57991   int32x4_t __s1_694 = __p1_694; \
  57992   __ret_694 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_694), (int16x4_t)(vqrshrn_n_s32(__s1_694, __p2_694)))); \
  57993   __ret_694; \
  57994 })
  57995 #else
  57996 #define vqrshrn_high_n_s32(__p0_695, __p1_695, __p2_695) __extension__ ({ \
  57997   int16x8_t __ret_695; \
  57998   int16x4_t __s0_695 = __p0_695; \
  57999   int32x4_t __s1_695 = __p1_695; \
  58000   int16x4_t __rev0_695;  __rev0_695 = __builtin_shufflevector(__s0_695, __s0_695, 3, 2, 1, 0); \
  58001   int32x4_t __rev1_695;  __rev1_695 = __builtin_shufflevector(__s1_695, __s1_695, 3, 2, 1, 0); \
  58002   __ret_695 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_695), (int16x4_t)(__noswap_vqrshrn_n_s32(__rev1_695, __p2_695)))); \
  58003   __ret_695 = __builtin_shufflevector(__ret_695, __ret_695, 7, 6, 5, 4, 3, 2, 1, 0); \
  58004   __ret_695; \
  58005 })
  58006 #endif
  58007 
  /* vqrshrn_high_n_s64(__p0, __p1, __p2): statement-expression macro yielding
   * an int32x4_t. __p0 is copied into an int32x2_t and __p1 into an int64x2_t;
   * the result is vcombine_s32(__s0, vqrshrn_n_s64(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  58008 #ifdef __LITTLE_ENDIAN__
  58009 #define vqrshrn_high_n_s64(__p0_696, __p1_696, __p2_696) __extension__ ({ \
  58010   int32x4_t __ret_696; \
  58011   int32x2_t __s0_696 = __p0_696; \
  58012   int64x2_t __s1_696 = __p1_696; \
  58013   __ret_696 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_696), (int32x2_t)(vqrshrn_n_s64(__s1_696, __p2_696)))); \
  58014   __ret_696; \
  58015 })
  58016 #else
  58017 #define vqrshrn_high_n_s64(__p0_697, __p1_697, __p2_697) __extension__ ({ \
  58018   int32x4_t __ret_697; \
  58019   int32x2_t __s0_697 = __p0_697; \
  58020   int64x2_t __s1_697 = __p1_697; \
  58021   int32x2_t __rev0_697;  __rev0_697 = __builtin_shufflevector(__s0_697, __s0_697, 1, 0); \
  58022   int64x2_t __rev1_697;  __rev1_697 = __builtin_shufflevector(__s1_697, __s1_697, 1, 0); \
  58023   __ret_697 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_697), (int32x2_t)(__noswap_vqrshrn_n_s64(__rev1_697, __p2_697)))); \
  58024   __ret_697 = __builtin_shufflevector(__ret_697, __ret_697, 3, 2, 1, 0); \
  58025   __ret_697; \
  58026 })
  58027 #endif
  58028 
  /* vqrshrn_high_n_s16(__p0, __p1, __p2): statement-expression macro yielding
   * an int8x16_t. __p0 is copied into an int8x8_t and __p1 into an int16x8_t;
   * the result is vcombine_s8(__s0, vqrshrn_n_s16(__s1, __p2)), with __p2
   * forwarded untouched.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards. */
  58029 #ifdef __LITTLE_ENDIAN__
  58030 #define vqrshrn_high_n_s16(__p0_698, __p1_698, __p2_698) __extension__ ({ \
  58031   int8x16_t __ret_698; \
  58032   int8x8_t __s0_698 = __p0_698; \
  58033   int16x8_t __s1_698 = __p1_698; \
  58034   __ret_698 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_698), (int8x8_t)(vqrshrn_n_s16(__s1_698, __p2_698)))); \
  58035   __ret_698; \
  58036 })
  58037 #else
  58038 #define vqrshrn_high_n_s16(__p0_699, __p1_699, __p2_699) __extension__ ({ \
  58039   int8x16_t __ret_699; \
  58040   int8x8_t __s0_699 = __p0_699; \
  58041   int16x8_t __s1_699 = __p1_699; \
  58042   int8x8_t __rev0_699;  __rev0_699 = __builtin_shufflevector(__s0_699, __s0_699, 7, 6, 5, 4, 3, 2, 1, 0); \
  58043   int16x8_t __rev1_699;  __rev1_699 = __builtin_shufflevector(__s1_699, __s1_699, 7, 6, 5, 4, 3, 2, 1, 0); \
  58044   __ret_699 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_699), (int8x8_t)(__noswap_vqrshrn_n_s16(__rev1_699, __p2_699)))); \
  58045   __ret_699 = __builtin_shufflevector(__ret_699, __ret_699, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  58046   __ret_699; \
  58047 })
  58048 #endif
  58049 
  /* vqrshrns_n_u32(__p0, __p1): statement-expression macro yielding a uint16_t.
   * __p0 is copied into a uint32_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrns_n_u32 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58050 #define vqrshrns_n_u32(__p0, __p1) __extension__ ({ \
  58051   uint16_t __ret; \
  58052   uint32_t __s0 = __p0; \
  58053   __ret = (uint16_t) __builtin_neon_vqrshrns_n_u32(__s0, __p1); \
  58054   __ret; \
  58055 })
  /* vqrshrnd_n_u64(__p0, __p1): statement-expression macro yielding a uint32_t.
   * __p0 is copied into a uint64_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrnd_n_u64 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58056 #define vqrshrnd_n_u64(__p0, __p1) __extension__ ({ \
  58057   uint32_t __ret; \
  58058   uint64_t __s0 = __p0; \
  58059   __ret = (uint32_t) __builtin_neon_vqrshrnd_n_u64(__s0, __p1); \
  58060   __ret; \
  58061 })
  /* vqrshrnh_n_u16(__p0, __p1): statement-expression macro yielding a uint8_t.
   * __p0 is copied into a uint16_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrnh_n_u16 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58062 #define vqrshrnh_n_u16(__p0, __p1) __extension__ ({ \
  58063   uint8_t __ret; \
  58064   uint16_t __s0 = __p0; \
  58065   __ret = (uint8_t) __builtin_neon_vqrshrnh_n_u16(__s0, __p1); \
  58066   __ret; \
  58067 })
  /* vqrshrns_n_s32(__p0, __p1): statement-expression macro yielding an int16_t.
   * __p0 is copied into an int32_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrns_n_s32 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58068 #define vqrshrns_n_s32(__p0, __p1) __extension__ ({ \
  58069   int16_t __ret; \
  58070   int32_t __s0 = __p0; \
  58071   __ret = (int16_t) __builtin_neon_vqrshrns_n_s32(__s0, __p1); \
  58072   __ret; \
  58073 })
  /* vqrshrnd_n_s64(__p0, __p1): statement-expression macro yielding an int32_t.
   * __p0 is copied into an int64_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrnd_n_s64 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58074 #define vqrshrnd_n_s64(__p0, __p1) __extension__ ({ \
  58075   int32_t __ret; \
  58076   int64_t __s0 = __p0; \
  58077   __ret = (int32_t) __builtin_neon_vqrshrnd_n_s64(__s0, __p1); \
  58078   __ret; \
  58079 })
  /* vqrshrnh_n_s16(__p0, __p1): statement-expression macro yielding an int8_t.
   * __p0 is copied into an int16_t local; __p1 is pasted directly into the
   * __builtin_neon_vqrshrnh_n_s16 call rather than being stored in a local
   * (presumably because it must be a compile-time constant - confirm). */
  58080 #define vqrshrnh_n_s16(__p0, __p1) __extension__ ({ \
  58081   int8_t __ret; \
  58082   int16_t __s0 = __p0; \
  58083   __ret = (int8_t) __builtin_neon_vqrshrnh_n_s16(__s0, __p1); \
  58084   __ret; \
  58085 })
  /* vqrshrun_high_n_s32(__p0, __p1, __p2): statement-expression macro yielding
   * an int16x8_t. __p0 is copied into an int16x4_t and __p1 into an int32x4_t;
   * the result of vqrshrun_n_s32(__s1, __p2) is cast to int16x4_t and combined
   * with __s0 through vcombine_s16.
   * Big-endian: both vectors are lane-reversed, the __noswap_ variants are
   * called, and the combined result's lanes are reversed afterwards.
   * NOTE(review): the first operand and the result are declared with signed
   * vector types here; the ACLE intrinsic list appears to use unsigned types
   * (uint16x4_t / uint16x8_t) for this intrinsic - confirm before relying on
   * the signedness. */
  58086 #ifdef __LITTLE_ENDIAN__
  58087 #define vqrshrun_high_n_s32(__p0_700, __p1_700, __p2_700) __extension__ ({ \
  58088   int16x8_t __ret_700; \
  58089   int16x4_t __s0_700 = __p0_700; \
  58090   int32x4_t __s1_700 = __p1_700; \
  58091   __ret_700 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_700), (int16x4_t)(vqrshrun_n_s32(__s1_700, __p2_700)))); \
  58092   __ret_700; \
  58093 })
  58094 #else
  58095 #define vqrshrun_high_n_s32(__p0_701, __p1_701, __p2_701) __extension__ ({ \
  58096   int16x8_t __ret_701; \
  58097   int16x4_t __s0_701 = __p0_701; \
  58098   int32x4_t __s1_701 = __p1_701; \
  58099   int16x4_t __rev0_701;  __rev0_701 = __builtin_shufflevector(__s0_701, __s0_701, 3, 2, 1, 0); \
  58100   int32x4_t __rev1_701;  __rev1_701 = __builtin_shufflevector(__s1_701, __s1_701, 3, 2, 1, 0); \
  58101   __ret_701 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_701), (int16x4_t)(__noswap_vqrshrun_n_s32(__rev1_701, __p2_701)))); \
  58102   __ret_701 = __builtin_shufflevector(__ret_701, __ret_701, 7, 6, 5, 4, 3, 2, 1, 0); \
  58103   __ret_701; \
  58104 })
  58105 #endif
  58106 
  /* vqrshrun_high_n_s64(__p0, __p1, __p2): evaluates to an int32x4_t produced
   * by vcombine_s32 with __p0 (int32x2_t) as first operand and
   * vqrshrun_n_s64(__p1, __p2), cast to int32x2_t, as second operand.
   * NOTE(review): the vector types are signed here, whereas the scalar
   * vqrshrund_n_s64 in this file yields an unsigned type and the ACLE appears
   * to specify unsigned vectors -- confirm before relying on signedness. */
  58107 #ifdef __LITTLE_ENDIAN__
  58108 #define vqrshrun_high_n_s64(__p0_702, __p1_702, __p2_702) __extension__ ({ \
  58109   int32x4_t __ret_702; \
  58110   int32x2_t __s0_702 = __p0_702; \
  58111   int64x2_t __s1_702 = __p1_702; \
  58112   __ret_702 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_702), (int32x2_t)(vqrshrun_n_s64(__s1_702, __p2_702)))); \
  58113   __ret_702; \
  58114 })
  58115 #else
  /* Big-endian variant: reverses the 2 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 4 lanes of the combined result. */
  58116 #define vqrshrun_high_n_s64(__p0_703, __p1_703, __p2_703) __extension__ ({ \
  58117   int32x4_t __ret_703; \
  58118   int32x2_t __s0_703 = __p0_703; \
  58119   int64x2_t __s1_703 = __p1_703; \
  58120   int32x2_t __rev0_703;  __rev0_703 = __builtin_shufflevector(__s0_703, __s0_703, 1, 0); \
  58121   int64x2_t __rev1_703;  __rev1_703 = __builtin_shufflevector(__s1_703, __s1_703, 1, 0); \
  58122   __ret_703 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_703), (int32x2_t)(__noswap_vqrshrun_n_s64(__rev1_703, __p2_703)))); \
  58123   __ret_703 = __builtin_shufflevector(__ret_703, __ret_703, 3, 2, 1, 0); \
  58124   __ret_703; \
  58125 })
  58126 #endif
  58127 
  /* vqrshrun_high_n_s16(__p0, __p1, __p2): evaluates to an int8x16_t produced
   * by vcombine_s8 with __p0 (int8x8_t) as first operand and
   * vqrshrun_n_s16(__p1, __p2), cast to int8x8_t, as second operand.
   * NOTE(review): the vector types are signed here, whereas the scalar
   * vqrshrunh_n_s16 in this file yields an unsigned type and the ACLE appears
   * to specify unsigned vectors -- confirm before relying on signedness. */
  58128 #ifdef __LITTLE_ENDIAN__
  58129 #define vqrshrun_high_n_s16(__p0_704, __p1_704, __p2_704) __extension__ ({ \
  58130   int8x16_t __ret_704; \
  58131   int8x8_t __s0_704 = __p0_704; \
  58132   int16x8_t __s1_704 = __p1_704; \
  58133   __ret_704 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_704), (int8x8_t)(vqrshrun_n_s16(__s1_704, __p2_704)))); \
  58134   __ret_704; \
  58135 })
  58136 #else
  /* Big-endian variant: reverses the 8 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 16 lanes of the combined result. */
  58137 #define vqrshrun_high_n_s16(__p0_705, __p1_705, __p2_705) __extension__ ({ \
  58138   int8x16_t __ret_705; \
  58139   int8x8_t __s0_705 = __p0_705; \
  58140   int16x8_t __s1_705 = __p1_705; \
  58141   int8x8_t __rev0_705;  __rev0_705 = __builtin_shufflevector(__s0_705, __s0_705, 7, 6, 5, 4, 3, 2, 1, 0); \
  58142   int16x8_t __rev1_705;  __rev1_705 = __builtin_shufflevector(__s1_705, __s1_705, 7, 6, 5, 4, 3, 2, 1, 0); \
  58143   __ret_705 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_705), (int8x8_t)(__noswap_vqrshrun_n_s16(__rev1_705, __p2_705)))); \
  58144   __ret_705 = __builtin_shufflevector(__ret_705, __ret_705, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  58145   __ret_705; \
  58146 })
  58147 #endif
  58148 
  /* vqrshruns_n_s32(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int32_t temporary, calls __builtin_neon_vqrshruns_n_s32 on it with __p1
   * substituted textually, and evaluates to the result cast to uint16_t
   * (signed input, unsigned result type). */
  58149 #define vqrshruns_n_s32(__p0, __p1) __extension__ ({ \
  58150   uint16_t __ret; \
  58151   int32_t __s0 = __p0; \
  58152   __ret = (uint16_t) __builtin_neon_vqrshruns_n_s32(__s0, __p1); \
  58153   __ret; \
  58154 })
  /* vqrshrund_n_s64(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int64_t temporary, calls __builtin_neon_vqrshrund_n_s64 on it with __p1
   * substituted textually, and evaluates to the result cast to uint32_t
   * (signed input, unsigned result type). */
  58155 #define vqrshrund_n_s64(__p0, __p1) __extension__ ({ \
  58156   uint32_t __ret; \
  58157   int64_t __s0 = __p0; \
  58158   __ret = (uint32_t) __builtin_neon_vqrshrund_n_s64(__s0, __p1); \
  58159   __ret; \
  58160 })
  /* vqrshrunh_n_s16(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int16_t temporary, calls __builtin_neon_vqrshrunh_n_s16 on it with __p1
   * substituted textually, and evaluates to the result cast to uint8_t
   * (signed input, unsigned result type). */
  58161 #define vqrshrunh_n_s16(__p0, __p1) __extension__ ({ \
  58162   uint8_t __ret; \
  58163   int16_t __s0 = __p0; \
  58164   __ret = (uint8_t) __builtin_neon_vqrshrunh_n_s16(__s0, __p1); \
  58165   __ret; \
  58166 })
  /* vqshlb_u8: forwards __p0 (uint8_t) and __p1 (int8_t) to
   * __builtin_neon_vqshlb_u8 and returns the result cast to uint8_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58167 __ai __attribute__((target("neon"))) uint8_t vqshlb_u8(uint8_t __p0, int8_t __p1) {
  58168   uint8_t __ret;
  58169   __ret = (uint8_t) __builtin_neon_vqshlb_u8(__p0, __p1);
  58170   return __ret;
  58171 }
  /* vqshls_u32: forwards __p0 (uint32_t) and __p1 (int32_t) to
   * __builtin_neon_vqshls_u32 and returns the result cast to uint32_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58172 __ai __attribute__((target("neon"))) uint32_t vqshls_u32(uint32_t __p0, int32_t __p1) {
  58173   uint32_t __ret;
  58174   __ret = (uint32_t) __builtin_neon_vqshls_u32(__p0, __p1);
  58175   return __ret;
  58176 }
  /* vqshld_u64: forwards __p0 (uint64_t) and __p1 (int64_t) to
   * __builtin_neon_vqshld_u64 and returns the result cast to uint64_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58177 __ai __attribute__((target("neon"))) uint64_t vqshld_u64(uint64_t __p0, int64_t __p1) {
  58178   uint64_t __ret;
  58179   __ret = (uint64_t) __builtin_neon_vqshld_u64(__p0, __p1);
  58180   return __ret;
  58181 }
  /* vqshlh_u16: forwards __p0 (uint16_t) and __p1 (int16_t) to
   * __builtin_neon_vqshlh_u16 and returns the result cast to uint16_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58182 __ai __attribute__((target("neon"))) uint16_t vqshlh_u16(uint16_t __p0, int16_t __p1) {
  58183   uint16_t __ret;
  58184   __ret = (uint16_t) __builtin_neon_vqshlh_u16(__p0, __p1);
  58185   return __ret;
  58186 }
  /* vqshlb_s8: forwards __p0 and __p1 (both int8_t) to
   * __builtin_neon_vqshlb_s8 and returns the result cast to int8_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58187 __ai __attribute__((target("neon"))) int8_t vqshlb_s8(int8_t __p0, int8_t __p1) {
  58188   int8_t __ret;
  58189   __ret = (int8_t) __builtin_neon_vqshlb_s8(__p0, __p1);
  58190   return __ret;
  58191 }
  /* vqshls_s32: forwards __p0 and __p1 (both int32_t) to
   * __builtin_neon_vqshls_s32 and returns the result cast to int32_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58192 __ai __attribute__((target("neon"))) int32_t vqshls_s32(int32_t __p0, int32_t __p1) {
  58193   int32_t __ret;
  58194   __ret = (int32_t) __builtin_neon_vqshls_s32(__p0, __p1);
  58195   return __ret;
  58196 }
  /* vqshld_s64: forwards __p0 and __p1 (both int64_t) to
   * __builtin_neon_vqshld_s64 and returns the result cast to int64_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58197 __ai __attribute__((target("neon"))) int64_t vqshld_s64(int64_t __p0, int64_t __p1) {
  58198   int64_t __ret;
  58199   __ret = (int64_t) __builtin_neon_vqshld_s64(__p0, __p1);
  58200   return __ret;
  58201 }
  /* vqshlh_s16: forwards __p0 and __p1 (both int16_t) to
   * __builtin_neon_vqshlh_s16 and returns the result cast to int16_t.
   * NOTE(review): presumably a saturating shift left of __p0 by __p1; the
   * arithmetic is inside the builtin. */
  58202 __ai __attribute__((target("neon"))) int16_t vqshlh_s16(int16_t __p0, int16_t __p1) {
  58203   int16_t __ret;
  58204   __ret = (int16_t) __builtin_neon_vqshlh_s16(__p0, __p1);
  58205   return __ret;
  58206 }
  /* vqshlb_n_u8(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint8_t temporary, calls __builtin_neon_vqshlb_n_u8 on it with __p1
   * substituted textually, and evaluates to the result cast to uint8_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58207 #define vqshlb_n_u8(__p0, __p1) __extension__ ({ \
  58208   uint8_t __ret; \
  58209   uint8_t __s0 = __p0; \
  58210   __ret = (uint8_t) __builtin_neon_vqshlb_n_u8(__s0, __p1); \
  58211   __ret; \
  58212 })
  /* vqshls_n_u32(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint32_t temporary, calls __builtin_neon_vqshls_n_u32 on it with __p1
   * substituted textually, and evaluates to the result cast to uint32_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58213 #define vqshls_n_u32(__p0, __p1) __extension__ ({ \
  58214   uint32_t __ret; \
  58215   uint32_t __s0 = __p0; \
  58216   __ret = (uint32_t) __builtin_neon_vqshls_n_u32(__s0, __p1); \
  58217   __ret; \
  58218 })
  /* vqshld_n_u64(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint64_t temporary, calls __builtin_neon_vqshld_n_u64 on it with __p1
   * substituted textually, and evaluates to the result cast to uint64_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58219 #define vqshld_n_u64(__p0, __p1) __extension__ ({ \
  58220   uint64_t __ret; \
  58221   uint64_t __s0 = __p0; \
  58222   __ret = (uint64_t) __builtin_neon_vqshld_n_u64(__s0, __p1); \
  58223   __ret; \
  58224 })
  /* vqshlh_n_u16(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint16_t temporary, calls __builtin_neon_vqshlh_n_u16 on it with __p1
   * substituted textually, and evaluates to the result cast to uint16_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58225 #define vqshlh_n_u16(__p0, __p1) __extension__ ({ \
  58226   uint16_t __ret; \
  58227   uint16_t __s0 = __p0; \
  58228   __ret = (uint16_t) __builtin_neon_vqshlh_n_u16(__s0, __p1); \
  58229   __ret; \
  58230 })
  /* vqshlb_n_s8(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int8_t temporary, calls __builtin_neon_vqshlb_n_s8 on it with __p1
   * substituted textually, and evaluates to the result cast to int8_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58231 #define vqshlb_n_s8(__p0, __p1) __extension__ ({ \
  58232   int8_t __ret; \
  58233   int8_t __s0 = __p0; \
  58234   __ret = (int8_t) __builtin_neon_vqshlb_n_s8(__s0, __p1); \
  58235   __ret; \
  58236 })
  /* vqshls_n_s32(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int32_t temporary, calls __builtin_neon_vqshls_n_s32 on it with __p1
   * substituted textually, and evaluates to the result cast to int32_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58237 #define vqshls_n_s32(__p0, __p1) __extension__ ({ \
  58238   int32_t __ret; \
  58239   int32_t __s0 = __p0; \
  58240   __ret = (int32_t) __builtin_neon_vqshls_n_s32(__s0, __p1); \
  58241   __ret; \
  58242 })
  /* vqshld_n_s64(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int64_t temporary, calls __builtin_neon_vqshld_n_s64 on it with __p1
   * substituted textually, and evaluates to the result cast to int64_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58243 #define vqshld_n_s64(__p0, __p1) __extension__ ({ \
  58244   int64_t __ret; \
  58245   int64_t __s0 = __p0; \
  58246   __ret = (int64_t) __builtin_neon_vqshld_n_s64(__s0, __p1); \
  58247   __ret; \
  58248 })
  /* vqshlh_n_s16(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int16_t temporary, calls __builtin_neon_vqshlh_n_s16 on it with __p1
   * substituted textually, and evaluates to the result cast to int16_t.
   * NOTE(review): presumably __p1 must be an integer constant shift amount. */
  58249 #define vqshlh_n_s16(__p0, __p1) __extension__ ({ \
  58250   int16_t __ret; \
  58251   int16_t __s0 = __p0; \
  58252   __ret = (int16_t) __builtin_neon_vqshlh_n_s16(__s0, __p1); \
  58253   __ret; \
  58254 })
  /* vqshlub_n_s8(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int8_t temporary, calls __builtin_neon_vqshlub_n_s8 on it with __p1
   * substituted textually, and evaluates to the result cast to int8_t.
   * NOTE(review): the result type is signed here; the ACLE appears to declare
   * an unsigned result for this signed-to-unsigned form -- confirm. */
  58255 #define vqshlub_n_s8(__p0, __p1) __extension__ ({ \
  58256   int8_t __ret; \
  58257   int8_t __s0 = __p0; \
  58258   __ret = (int8_t) __builtin_neon_vqshlub_n_s8(__s0, __p1); \
  58259   __ret; \
  58260 })
  /* vqshlus_n_s32(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int32_t temporary, calls __builtin_neon_vqshlus_n_s32 on it with __p1
   * substituted textually, and evaluates to the result cast to int32_t.
   * NOTE(review): the result type is signed here; the ACLE appears to declare
   * an unsigned result for this signed-to-unsigned form -- confirm. */
  58261 #define vqshlus_n_s32(__p0, __p1) __extension__ ({ \
  58262   int32_t __ret; \
  58263   int32_t __s0 = __p0; \
  58264   __ret = (int32_t) __builtin_neon_vqshlus_n_s32(__s0, __p1); \
  58265   __ret; \
  58266 })
  /* vqshlud_n_s64(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int64_t temporary, calls __builtin_neon_vqshlud_n_s64 on it with __p1
   * substituted textually, and evaluates to the result cast to int64_t.
   * NOTE(review): the result type is signed here; the ACLE appears to declare
   * an unsigned result for this signed-to-unsigned form -- confirm. */
  58267 #define vqshlud_n_s64(__p0, __p1) __extension__ ({ \
  58268   int64_t __ret; \
  58269   int64_t __s0 = __p0; \
  58270   __ret = (int64_t) __builtin_neon_vqshlud_n_s64(__s0, __p1); \
  58271   __ret; \
  58272 })
  /* vqshluh_n_s16(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int16_t temporary, calls __builtin_neon_vqshluh_n_s16 on it with __p1
   * substituted textually, and evaluates to the result cast to int16_t.
   * NOTE(review): the result type is signed here; the ACLE appears to declare
   * an unsigned result for this signed-to-unsigned form -- confirm. */
  58273 #define vqshluh_n_s16(__p0, __p1) __extension__ ({ \
  58274   int16_t __ret; \
  58275   int16_t __s0 = __p0; \
  58276   __ret = (int16_t) __builtin_neon_vqshluh_n_s16(__s0, __p1); \
  58277   __ret; \
  58278 })
  /* vqshrn_high_n_u32(__p0, __p1, __p2): evaluates to a uint16x8_t produced by
   * vcombine_u16 with __p0 (uint16x4_t) as first operand and
   * vqshrn_n_u32(__p1, __p2), cast to uint16x4_t, as second operand. */
  58279 #ifdef __LITTLE_ENDIAN__
  58280 #define vqshrn_high_n_u32(__p0_706, __p1_706, __p2_706) __extension__ ({ \
  58281   uint16x8_t __ret_706; \
  58282   uint16x4_t __s0_706 = __p0_706; \
  58283   uint32x4_t __s1_706 = __p1_706; \
  58284   __ret_706 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_706), (uint16x4_t)(vqshrn_n_u32(__s1_706, __p2_706)))); \
  58285   __ret_706; \
  58286 })
  58287 #else
  /* Big-endian variant: reverses the 4 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 8 lanes of the combined result. */
  58288 #define vqshrn_high_n_u32(__p0_707, __p1_707, __p2_707) __extension__ ({ \
  58289   uint16x8_t __ret_707; \
  58290   uint16x4_t __s0_707 = __p0_707; \
  58291   uint32x4_t __s1_707 = __p1_707; \
  58292   uint16x4_t __rev0_707;  __rev0_707 = __builtin_shufflevector(__s0_707, __s0_707, 3, 2, 1, 0); \
  58293   uint32x4_t __rev1_707;  __rev1_707 = __builtin_shufflevector(__s1_707, __s1_707, 3, 2, 1, 0); \
  58294   __ret_707 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_707), (uint16x4_t)(__noswap_vqshrn_n_u32(__rev1_707, __p2_707)))); \
  58295   __ret_707 = __builtin_shufflevector(__ret_707, __ret_707, 7, 6, 5, 4, 3, 2, 1, 0); \
  58296   __ret_707; \
  58297 })
  58298 #endif
  58299 
  /* vqshrn_high_n_u64(__p0, __p1, __p2): evaluates to a uint32x4_t produced by
   * vcombine_u32 with __p0 (uint32x2_t) as first operand and
   * vqshrn_n_u64(__p1, __p2), cast to uint32x2_t, as second operand. */
  58300 #ifdef __LITTLE_ENDIAN__
  58301 #define vqshrn_high_n_u64(__p0_708, __p1_708, __p2_708) __extension__ ({ \
  58302   uint32x4_t __ret_708; \
  58303   uint32x2_t __s0_708 = __p0_708; \
  58304   uint64x2_t __s1_708 = __p1_708; \
  58305   __ret_708 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_708), (uint32x2_t)(vqshrn_n_u64(__s1_708, __p2_708)))); \
  58306   __ret_708; \
  58307 })
  58308 #else
  /* Big-endian variant: reverses the 2 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 4 lanes of the combined result. */
  58309 #define vqshrn_high_n_u64(__p0_709, __p1_709, __p2_709) __extension__ ({ \
  58310   uint32x4_t __ret_709; \
  58311   uint32x2_t __s0_709 = __p0_709; \
  58312   uint64x2_t __s1_709 = __p1_709; \
  58313   uint32x2_t __rev0_709;  __rev0_709 = __builtin_shufflevector(__s0_709, __s0_709, 1, 0); \
  58314   uint64x2_t __rev1_709;  __rev1_709 = __builtin_shufflevector(__s1_709, __s1_709, 1, 0); \
  58315   __ret_709 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_709), (uint32x2_t)(__noswap_vqshrn_n_u64(__rev1_709, __p2_709)))); \
  58316   __ret_709 = __builtin_shufflevector(__ret_709, __ret_709, 3, 2, 1, 0); \
  58317   __ret_709; \
  58318 })
  58319 #endif
  58320 
  /* vqshrn_high_n_u16(__p0, __p1, __p2): evaluates to a uint8x16_t produced by
   * vcombine_u8 with __p0 (uint8x8_t) as first operand and
   * vqshrn_n_u16(__p1, __p2), cast to uint8x8_t, as second operand. */
  58321 #ifdef __LITTLE_ENDIAN__
  58322 #define vqshrn_high_n_u16(__p0_710, __p1_710, __p2_710) __extension__ ({ \
  58323   uint8x16_t __ret_710; \
  58324   uint8x8_t __s0_710 = __p0_710; \
  58325   uint16x8_t __s1_710 = __p1_710; \
  58326   __ret_710 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_710), (uint8x8_t)(vqshrn_n_u16(__s1_710, __p2_710)))); \
  58327   __ret_710; \
  58328 })
  58329 #else
  /* Big-endian variant: reverses the 8 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 16 lanes of the combined result. */
  58330 #define vqshrn_high_n_u16(__p0_711, __p1_711, __p2_711) __extension__ ({ \
  58331   uint8x16_t __ret_711; \
  58332   uint8x8_t __s0_711 = __p0_711; \
  58333   uint16x8_t __s1_711 = __p1_711; \
  58334   uint8x8_t __rev0_711;  __rev0_711 = __builtin_shufflevector(__s0_711, __s0_711, 7, 6, 5, 4, 3, 2, 1, 0); \
  58335   uint16x8_t __rev1_711;  __rev1_711 = __builtin_shufflevector(__s1_711, __s1_711, 7, 6, 5, 4, 3, 2, 1, 0); \
  58336   __ret_711 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_711), (uint8x8_t)(__noswap_vqshrn_n_u16(__rev1_711, __p2_711)))); \
  58337   __ret_711 = __builtin_shufflevector(__ret_711, __ret_711, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  58338   __ret_711; \
  58339 })
  58340 #endif
  58341 
  /* vqshrn_high_n_s32(__p0, __p1, __p2): evaluates to an int16x8_t produced by
   * vcombine_s16 with __p0 (int16x4_t) as first operand and
   * vqshrn_n_s32(__p1, __p2), cast to int16x4_t, as second operand. */
  58342 #ifdef __LITTLE_ENDIAN__
  58343 #define vqshrn_high_n_s32(__p0_712, __p1_712, __p2_712) __extension__ ({ \
  58344   int16x8_t __ret_712; \
  58345   int16x4_t __s0_712 = __p0_712; \
  58346   int32x4_t __s1_712 = __p1_712; \
  58347   __ret_712 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_712), (int16x4_t)(vqshrn_n_s32(__s1_712, __p2_712)))); \
  58348   __ret_712; \
  58349 })
  58350 #else
  /* Big-endian variant: reverses the 4 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 8 lanes of the combined result. */
  58351 #define vqshrn_high_n_s32(__p0_713, __p1_713, __p2_713) __extension__ ({ \
  58352   int16x8_t __ret_713; \
  58353   int16x4_t __s0_713 = __p0_713; \
  58354   int32x4_t __s1_713 = __p1_713; \
  58355   int16x4_t __rev0_713;  __rev0_713 = __builtin_shufflevector(__s0_713, __s0_713, 3, 2, 1, 0); \
  58356   int32x4_t __rev1_713;  __rev1_713 = __builtin_shufflevector(__s1_713, __s1_713, 3, 2, 1, 0); \
  58357   __ret_713 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_713), (int16x4_t)(__noswap_vqshrn_n_s32(__rev1_713, __p2_713)))); \
  58358   __ret_713 = __builtin_shufflevector(__ret_713, __ret_713, 7, 6, 5, 4, 3, 2, 1, 0); \
  58359   __ret_713; \
  58360 })
  58361 #endif
  58362 
  /* vqshrn_high_n_s64(__p0, __p1, __p2): evaluates to an int32x4_t produced by
   * vcombine_s32 with __p0 (int32x2_t) as first operand and
   * vqshrn_n_s64(__p1, __p2), cast to int32x2_t, as second operand. */
  58363 #ifdef __LITTLE_ENDIAN__
  58364 #define vqshrn_high_n_s64(__p0_714, __p1_714, __p2_714) __extension__ ({ \
  58365   int32x4_t __ret_714; \
  58366   int32x2_t __s0_714 = __p0_714; \
  58367   int64x2_t __s1_714 = __p1_714; \
  58368   __ret_714 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_714), (int32x2_t)(vqshrn_n_s64(__s1_714, __p2_714)))); \
  58369   __ret_714; \
  58370 })
  58371 #else
  /* Big-endian variant: reverses the 2 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 4 lanes of the combined result. */
  58372 #define vqshrn_high_n_s64(__p0_715, __p1_715, __p2_715) __extension__ ({ \
  58373   int32x4_t __ret_715; \
  58374   int32x2_t __s0_715 = __p0_715; \
  58375   int64x2_t __s1_715 = __p1_715; \
  58376   int32x2_t __rev0_715;  __rev0_715 = __builtin_shufflevector(__s0_715, __s0_715, 1, 0); \
  58377   int64x2_t __rev1_715;  __rev1_715 = __builtin_shufflevector(__s1_715, __s1_715, 1, 0); \
  58378   __ret_715 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_715), (int32x2_t)(__noswap_vqshrn_n_s64(__rev1_715, __p2_715)))); \
  58379   __ret_715 = __builtin_shufflevector(__ret_715, __ret_715, 3, 2, 1, 0); \
  58380   __ret_715; \
  58381 })
  58382 #endif
  58383 
  /* vqshrn_high_n_s16(__p0, __p1, __p2): evaluates to an int8x16_t produced by
   * vcombine_s8 with __p0 (int8x8_t) as first operand and
   * vqshrn_n_s16(__p1, __p2), cast to int8x8_t, as second operand. */
  58384 #ifdef __LITTLE_ENDIAN__
  58385 #define vqshrn_high_n_s16(__p0_716, __p1_716, __p2_716) __extension__ ({ \
  58386   int8x16_t __ret_716; \
  58387   int8x8_t __s0_716 = __p0_716; \
  58388   int16x8_t __s1_716 = __p1_716; \
  58389   __ret_716 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_716), (int8x8_t)(vqshrn_n_s16(__s1_716, __p2_716)))); \
  58390   __ret_716; \
  58391 })
  58392 #else
  /* Big-endian variant: reverses the 8 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 16 lanes of the combined result. */
  58393 #define vqshrn_high_n_s16(__p0_717, __p1_717, __p2_717) __extension__ ({ \
  58394   int8x16_t __ret_717; \
  58395   int8x8_t __s0_717 = __p0_717; \
  58396   int16x8_t __s1_717 = __p1_717; \
  58397   int8x8_t __rev0_717;  __rev0_717 = __builtin_shufflevector(__s0_717, __s0_717, 7, 6, 5, 4, 3, 2, 1, 0); \
  58398   int16x8_t __rev1_717;  __rev1_717 = __builtin_shufflevector(__s1_717, __s1_717, 7, 6, 5, 4, 3, 2, 1, 0); \
  58399   __ret_717 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_717), (int8x8_t)(__noswap_vqshrn_n_s16(__rev1_717, __p2_717)))); \
  58400   __ret_717 = __builtin_shufflevector(__ret_717, __ret_717, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  58401   __ret_717; \
  58402 })
  58403 #endif
  58404 
  /* vqshrns_n_u32(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint32_t temporary, calls __builtin_neon_vqshrns_n_u32 on it with __p1
   * substituted textually, and evaluates to the result cast to uint16_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58405 #define vqshrns_n_u32(__p0, __p1) __extension__ ({ \
  58406   uint16_t __ret; \
  58407   uint32_t __s0 = __p0; \
  58408   __ret = (uint16_t) __builtin_neon_vqshrns_n_u32(__s0, __p1); \
  58409   __ret; \
  58410 })
  /* vqshrnd_n_u64(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint64_t temporary, calls __builtin_neon_vqshrnd_n_u64 on it with __p1
   * substituted textually, and evaluates to the result cast to uint32_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58411 #define vqshrnd_n_u64(__p0, __p1) __extension__ ({ \
  58412   uint32_t __ret; \
  58413   uint64_t __s0 = __p0; \
  58414   __ret = (uint32_t) __builtin_neon_vqshrnd_n_u64(__s0, __p1); \
  58415   __ret; \
  58416 })
  /* vqshrnh_n_u16(__p0, __p1): statement-expression macro. Stores __p0 in a
   * uint16_t temporary, calls __builtin_neon_vqshrnh_n_u16 on it with __p1
   * substituted textually, and evaluates to the result cast to uint8_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58417 #define vqshrnh_n_u16(__p0, __p1) __extension__ ({ \
  58418   uint8_t __ret; \
  58419   uint16_t __s0 = __p0; \
  58420   __ret = (uint8_t) __builtin_neon_vqshrnh_n_u16(__s0, __p1); \
  58421   __ret; \
  58422 })
  /* vqshrns_n_s32(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int32_t temporary, calls __builtin_neon_vqshrns_n_s32 on it with __p1
   * substituted textually, and evaluates to the result cast to int16_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58423 #define vqshrns_n_s32(__p0, __p1) __extension__ ({ \
  58424   int16_t __ret; \
  58425   int32_t __s0 = __p0; \
  58426   __ret = (int16_t) __builtin_neon_vqshrns_n_s32(__s0, __p1); \
  58427   __ret; \
  58428 })
  /* vqshrnd_n_s64(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int64_t temporary, calls __builtin_neon_vqshrnd_n_s64 on it with __p1
   * substituted textually, and evaluates to the result cast to int32_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58429 #define vqshrnd_n_s64(__p0, __p1) __extension__ ({ \
  58430   int32_t __ret; \
  58431   int64_t __s0 = __p0; \
  58432   __ret = (int32_t) __builtin_neon_vqshrnd_n_s64(__s0, __p1); \
  58433   __ret; \
  58434 })
  /* vqshrnh_n_s16(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int16_t temporary, calls __builtin_neon_vqshrnh_n_s16 on it with __p1
   * substituted textually, and evaluates to the result cast to int8_t.
   * NOTE(review): semantics (presumably saturating shift-right-narrow) are
   * defined by the builtin, not by this header. */
  58435 #define vqshrnh_n_s16(__p0, __p1) __extension__ ({ \
  58436   int8_t __ret; \
  58437   int16_t __s0 = __p0; \
  58438   __ret = (int8_t) __builtin_neon_vqshrnh_n_s16(__s0, __p1); \
  58439   __ret; \
  58440 })
  /* vqshrun_high_n_s32(__p0, __p1, __p2): evaluates to an int16x8_t produced
   * by vcombine_s16 with __p0 (int16x4_t) as first operand and
   * vqshrun_n_s32(__p1, __p2), cast to int16x4_t, as second operand.
   * NOTE(review): the vector types are signed here, whereas the scalar
   * vqshruns_n_s32 in this file yields an unsigned type and the ACLE appears
   * to specify unsigned vectors -- confirm before relying on signedness. */
  58441 #ifdef __LITTLE_ENDIAN__
  58442 #define vqshrun_high_n_s32(__p0_718, __p1_718, __p2_718) __extension__ ({ \
  58443   int16x8_t __ret_718; \
  58444   int16x4_t __s0_718 = __p0_718; \
  58445   int32x4_t __s1_718 = __p1_718; \
  58446   __ret_718 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_718), (int16x4_t)(vqshrun_n_s32(__s1_718, __p2_718)))); \
  58447   __ret_718; \
  58448 })
  58449 #else
  /* Big-endian variant: reverses the 4 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 8 lanes of the combined result. */
  58450 #define vqshrun_high_n_s32(__p0_719, __p1_719, __p2_719) __extension__ ({ \
  58451   int16x8_t __ret_719; \
  58452   int16x4_t __s0_719 = __p0_719; \
  58453   int32x4_t __s1_719 = __p1_719; \
  58454   int16x4_t __rev0_719;  __rev0_719 = __builtin_shufflevector(__s0_719, __s0_719, 3, 2, 1, 0); \
  58455   int32x4_t __rev1_719;  __rev1_719 = __builtin_shufflevector(__s1_719, __s1_719, 3, 2, 1, 0); \
  58456   __ret_719 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_719), (int16x4_t)(__noswap_vqshrun_n_s32(__rev1_719, __p2_719)))); \
  58457   __ret_719 = __builtin_shufflevector(__ret_719, __ret_719, 7, 6, 5, 4, 3, 2, 1, 0); \
  58458   __ret_719; \
  58459 })
  58460 #endif
  58461 
  /* vqshrun_high_n_s64(__p0, __p1, __p2): evaluates to an int32x4_t produced
   * by vcombine_s32 with __p0 (int32x2_t) as first operand and
   * vqshrun_n_s64(__p1, __p2), cast to int32x2_t, as second operand.
   * NOTE(review): the vector types are signed here, whereas the scalar
   * vqshrund_n_s64 in this file yields an unsigned type and the ACLE appears
   * to specify unsigned vectors -- confirm before relying on signedness. */
  58462 #ifdef __LITTLE_ENDIAN__
  58463 #define vqshrun_high_n_s64(__p0_720, __p1_720, __p2_720) __extension__ ({ \
  58464   int32x4_t __ret_720; \
  58465   int32x2_t __s0_720 = __p0_720; \
  58466   int64x2_t __s1_720 = __p1_720; \
  58467   __ret_720 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_720), (int32x2_t)(vqshrun_n_s64(__s1_720, __p2_720)))); \
  58468   __ret_720; \
  58469 })
  58470 #else
  /* Big-endian variant: reverses the 2 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 4 lanes of the combined result. */
  58471 #define vqshrun_high_n_s64(__p0_721, __p1_721, __p2_721) __extension__ ({ \
  58472   int32x4_t __ret_721; \
  58473   int32x2_t __s0_721 = __p0_721; \
  58474   int64x2_t __s1_721 = __p1_721; \
  58475   int32x2_t __rev0_721;  __rev0_721 = __builtin_shufflevector(__s0_721, __s0_721, 1, 0); \
  58476   int64x2_t __rev1_721;  __rev1_721 = __builtin_shufflevector(__s1_721, __s1_721, 1, 0); \
  58477   __ret_721 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_721), (int32x2_t)(__noswap_vqshrun_n_s64(__rev1_721, __p2_721)))); \
  58478   __ret_721 = __builtin_shufflevector(__ret_721, __ret_721, 3, 2, 1, 0); \
  58479   __ret_721; \
  58480 })
  58481 #endif
  58482 
  /* vqshrun_high_n_s16(__p0, __p1, __p2): evaluates to an int8x16_t produced
   * by vcombine_s8 with __p0 (int8x8_t) as first operand and
   * vqshrun_n_s16(__p1, __p2), cast to int8x8_t, as second operand.
   * NOTE(review): the vector types are signed here, whereas the scalar
   * vqshrunh_n_s16 in this file yields an unsigned type and the ACLE appears
   * to specify unsigned vectors -- confirm before relying on signedness. */
  58483 #ifdef __LITTLE_ENDIAN__
  58484 #define vqshrun_high_n_s16(__p0_722, __p1_722, __p2_722) __extension__ ({ \
  58485   int8x16_t __ret_722; \
  58486   int8x8_t __s0_722 = __p0_722; \
  58487   int16x8_t __s1_722 = __p1_722; \
  58488   __ret_722 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_722), (int8x8_t)(vqshrun_n_s16(__s1_722, __p2_722)))); \
  58489   __ret_722; \
  58490 })
  58491 #else
  /* Big-endian variant: reverses the 8 lanes of each input with
   * __builtin_shufflevector, calls the __noswap_ forms of the helpers, then
   * reverses the 16 lanes of the combined result. */
  58492 #define vqshrun_high_n_s16(__p0_723, __p1_723, __p2_723) __extension__ ({ \
  58493   int8x16_t __ret_723; \
  58494   int8x8_t __s0_723 = __p0_723; \
  58495   int16x8_t __s1_723 = __p1_723; \
  58496   int8x8_t __rev0_723;  __rev0_723 = __builtin_shufflevector(__s0_723, __s0_723, 7, 6, 5, 4, 3, 2, 1, 0); \
  58497   int16x8_t __rev1_723;  __rev1_723 = __builtin_shufflevector(__s1_723, __s1_723, 7, 6, 5, 4, 3, 2, 1, 0); \
  58498   __ret_723 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_723), (int8x8_t)(__noswap_vqshrun_n_s16(__rev1_723, __p2_723)))); \
  58499   __ret_723 = __builtin_shufflevector(__ret_723, __ret_723, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  58500   __ret_723; \
  58501 })
  58502 #endif
  58503 
  /* vqshruns_n_s32(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int32_t temporary, calls __builtin_neon_vqshruns_n_s32 on it with __p1
   * substituted textually, and evaluates to the result cast to uint16_t
   * (signed input, unsigned result type). */
  58504 #define vqshruns_n_s32(__p0, __p1) __extension__ ({ \
  58505   uint16_t __ret; \
  58506   int32_t __s0 = __p0; \
  58507   __ret = (uint16_t) __builtin_neon_vqshruns_n_s32(__s0, __p1); \
  58508   __ret; \
  58509 })
  /* vqshrund_n_s64(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int64_t temporary, calls __builtin_neon_vqshrund_n_s64 on it with __p1
   * substituted textually, and evaluates to the result cast to uint32_t
   * (signed input, unsigned result type). */
  58510 #define vqshrund_n_s64(__p0, __p1) __extension__ ({ \
  58511   uint32_t __ret; \
  58512   int64_t __s0 = __p0; \
  58513   __ret = (uint32_t) __builtin_neon_vqshrund_n_s64(__s0, __p1); \
  58514   __ret; \
  58515 })
  /* vqshrunh_n_s16(__p0, __p1): statement-expression macro. Stores __p0 in an
   * int16_t temporary, calls __builtin_neon_vqshrunh_n_s16 on it with __p1
   * substituted textually, and evaluates to the result cast to uint8_t
   * (signed input, unsigned result type). */
  58516 #define vqshrunh_n_s16(__p0, __p1) __extension__ ({ \
  58517   uint8_t __ret; \
  58518   int16_t __s0 = __p0; \
  58519   __ret = (uint8_t) __builtin_neon_vqshrunh_n_s16(__s0, __p1); \
  58520   __ret; \
  58521 })
  /* vqsubb_u8: forwards __p0 and __p1 (both uint8_t) to
   * __builtin_neon_vqsubb_u8 and returns the result cast to uint8_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58522 __ai __attribute__((target("neon"))) uint8_t vqsubb_u8(uint8_t __p0, uint8_t __p1) {
  58523   uint8_t __ret;
  58524   __ret = (uint8_t) __builtin_neon_vqsubb_u8(__p0, __p1);
  58525   return __ret;
  58526 }
  /* vqsubs_u32: forwards __p0 and __p1 (both uint32_t) to
   * __builtin_neon_vqsubs_u32 and returns the result cast to uint32_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58527 __ai __attribute__((target("neon"))) uint32_t vqsubs_u32(uint32_t __p0, uint32_t __p1) {
  58528   uint32_t __ret;
  58529   __ret = (uint32_t) __builtin_neon_vqsubs_u32(__p0, __p1);
  58530   return __ret;
  58531 }
  /* vqsubd_u64: forwards __p0 and __p1 (both uint64_t) to
   * __builtin_neon_vqsubd_u64 and returns the result cast to uint64_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58532 __ai __attribute__((target("neon"))) uint64_t vqsubd_u64(uint64_t __p0, uint64_t __p1) {
  58533   uint64_t __ret;
  58534   __ret = (uint64_t) __builtin_neon_vqsubd_u64(__p0, __p1);
  58535   return __ret;
  58536 }
  /* vqsubh_u16: forwards __p0 and __p1 (both uint16_t) to
   * __builtin_neon_vqsubh_u16 and returns the result cast to uint16_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58537 __ai __attribute__((target("neon"))) uint16_t vqsubh_u16(uint16_t __p0, uint16_t __p1) {
  58538   uint16_t __ret;
  58539   __ret = (uint16_t) __builtin_neon_vqsubh_u16(__p0, __p1);
  58540   return __ret;
  58541 }
  /* vqsubb_s8: forwards __p0 and __p1 (both int8_t) to
   * __builtin_neon_vqsubb_s8 and returns the result cast to int8_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58542 __ai __attribute__((target("neon"))) int8_t vqsubb_s8(int8_t __p0, int8_t __p1) {
  58543   int8_t __ret;
  58544   __ret = (int8_t) __builtin_neon_vqsubb_s8(__p0, __p1);
  58545   return __ret;
  58546 }
  /* vqsubs_s32: forwards __p0 and __p1 (both int32_t) to
   * __builtin_neon_vqsubs_s32 and returns the result cast to int32_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58547 __ai __attribute__((target("neon"))) int32_t vqsubs_s32(int32_t __p0, int32_t __p1) {
  58548   int32_t __ret;
  58549   __ret = (int32_t) __builtin_neon_vqsubs_s32(__p0, __p1);
  58550   return __ret;
  58551 }
  /* vqsubd_s64: forwards __p0 and __p1 (both int64_t) to
   * __builtin_neon_vqsubd_s64 and returns the result cast to int64_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58552 __ai __attribute__((target("neon"))) int64_t vqsubd_s64(int64_t __p0, int64_t __p1) {
  58553   int64_t __ret;
  58554   __ret = (int64_t) __builtin_neon_vqsubd_s64(__p0, __p1);
  58555   return __ret;
  58556 }
  /* vqsubh_s16: forwards __p0 and __p1 (both int16_t) to
   * __builtin_neon_vqsubh_s16 and returns the result cast to int16_t.
   * NOTE(review): presumably a saturating __p0 - __p1; the arithmetic is
   * inside the builtin. */
  58557 __ai __attribute__((target("neon"))) int16_t vqsubh_s16(int16_t __p0, int16_t __p1) {
  58558   int16_t __ret;
  58559   __ret = (int16_t) __builtin_neon_vqsubh_s16(__p0, __p1);
  58560   return __ret;
  58561 }
  /* vqtbl1_p8: passes __p0 (poly8x16_t) and __p1 (uint8x8_t), cast to
   * int8x16_t / int8x8_t, plus the constant 4 to __builtin_neon_vqtbl1_v and
   * returns the result cast to poly8x8_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58562 #ifdef __LITTLE_ENDIAN__
  58563 __ai __attribute__((target("neon"))) poly8x8_t vqtbl1_p8(poly8x16_t __p0, uint8x8_t __p1) {
  58564   poly8x8_t __ret;
  58565   __ret = (poly8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, (int8x8_t)__p1, 4);
  58566   return __ret;
  58567 }
  58568 #else
  /* Big-endian variant: reverses the lane order of __p0 (16 lanes) and __p1
   * (8 lanes) before the builtin call and of the 8-lane result after it. */
  58569 __ai __attribute__((target("neon"))) poly8x8_t vqtbl1_p8(poly8x16_t __p0, uint8x8_t __p1) {
  58570   poly8x8_t __ret;
  58571   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58572   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58573   __ret = (poly8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 4);
  58574   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58575   return __ret;
  58576 }
  58577 #endif
  58578 
  /* vqtbl1q_p8: passes __p0 (poly8x16_t) and __p1 (uint8x16_t), both cast to
   * int8x16_t, plus the constant 36 to __builtin_neon_vqtbl1q_v and returns
   * the result cast to poly8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58579 #ifdef __LITTLE_ENDIAN__
  58580 __ai __attribute__((target("neon"))) poly8x16_t vqtbl1q_p8(poly8x16_t __p0, uint8x16_t __p1) {
  58581   poly8x16_t __ret;
  58582   __ret = (poly8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 36);
  58583   return __ret;
  58584 }
  58585 #else
  /* Big-endian variant: reverses the 16 lanes of __p0 and of __p1 before the
   * builtin call and the 16 lanes of the result after it. */
  58586 __ai __attribute__((target("neon"))) poly8x16_t vqtbl1q_p8(poly8x16_t __p0, uint8x16_t __p1) {
  58587   poly8x16_t __ret;
  58588   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58589   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58590   __ret = (poly8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36);
  58591   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58592   return __ret;
  58593 }
  58594 #endif
  58595 
  /* vqtbl1q_u8: passes __p0 and __p1 (both uint8x16_t), cast to int8x16_t,
   * plus the constant 48 to __builtin_neon_vqtbl1q_v and returns the result
   * cast to uint8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58596 #ifdef __LITTLE_ENDIAN__
  58597 __ai __attribute__((target("neon"))) uint8x16_t vqtbl1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  58598   uint8x16_t __ret;
  58599   __ret = (uint8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  58600   return __ret;
  58601 }
  58602 #else
  /* Big-endian variant: reverses the 16 lanes of __p0 and of __p1 before the
   * builtin call and the 16 lanes of the result after it. */
  58603 __ai __attribute__((target("neon"))) uint8x16_t vqtbl1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  58604   uint8x16_t __ret;
  58605   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58606   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58607   __ret = (uint8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  58608   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58609   return __ret;
  58610 }
  58611 #endif
  58612 
  /* vqtbl1q_s8: passes __p0 (int8x16_t) and __p1 (uint8x16_t, cast to
   * int8x16_t) plus the constant 32 to __builtin_neon_vqtbl1q_v and returns
   * the result cast to int8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58613 #ifdef __LITTLE_ENDIAN__
  58614 __ai __attribute__((target("neon"))) int8x16_t vqtbl1q_s8(int8x16_t __p0, uint8x16_t __p1) {
  58615   int8x16_t __ret;
  58616   __ret = (int8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  58617   return __ret;
  58618 }
  58619 #else
  /* Big-endian variant: reverses the 16 lanes of __p0 and of __p1 before the
   * builtin call and the 16 lanes of the result after it. */
  58620 __ai __attribute__((target("neon"))) int8x16_t vqtbl1q_s8(int8x16_t __p0, uint8x16_t __p1) {
  58621   int8x16_t __ret;
  58622   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58623   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58624   __ret = (int8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  58625   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58626   return __ret;
  58627 }
  58628 #endif
  58629 
  /* vqtbl1_u8: passes __p0 (uint8x16_t) and __p1 (uint8x8_t), cast to
   * int8x16_t / int8x8_t, plus the constant 16 to __builtin_neon_vqtbl1_v and
   * returns the result cast to uint8x8_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58630 #ifdef __LITTLE_ENDIAN__
  58631 __ai __attribute__((target("neon"))) uint8x8_t vqtbl1_u8(uint8x16_t __p0, uint8x8_t __p1) {
  58632   uint8x8_t __ret;
  58633   __ret = (uint8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, (int8x8_t)__p1, 16);
  58634   return __ret;
  58635 }
  58636 #else
  /* Big-endian variant: reverses the lane order of __p0 (16 lanes) and __p1
   * (8 lanes) before the builtin call and of the 8-lane result after it. */
  58637 __ai __attribute__((target("neon"))) uint8x8_t vqtbl1_u8(uint8x16_t __p0, uint8x8_t __p1) {
  58638   uint8x8_t __ret;
  58639   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58640   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58641   __ret = (uint8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 16);
  58642   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58643   return __ret;
  58644 }
  58645 #endif
  58646 
  /* vqtbl1_s8: passes __p0 (int8x16_t) and __p1 (uint8x8_t, cast to int8x8_t)
   * plus the constant 0 to __builtin_neon_vqtbl1_v and returns the result
   * cast to int8x8_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin, and the name suggests a table lookup indexed by __p1 -- confirm. */
  58647 #ifdef __LITTLE_ENDIAN__
  58648 __ai __attribute__((target("neon"))) int8x8_t vqtbl1_s8(int8x16_t __p0, uint8x8_t __p1) {
  58649   int8x8_t __ret;
  58650   __ret = (int8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, (int8x8_t)__p1, 0);
  58651   return __ret;
  58652 }
  58653 #else
  /* Big-endian variant: reverses the lane order of __p0 (16 lanes) and __p1
   * (8 lanes) before the builtin call and of the 8-lane result after it. */
  58654 __ai __attribute__((target("neon"))) int8x8_t vqtbl1_s8(int8x16_t __p0, uint8x8_t __p1) {
  58655   int8x8_t __ret;
  58656   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58657   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58658   __ret = (int8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 0);
  58659   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58660   return __ret;
  58661 }
  58662 #endif
  58663 
  /* vqtbl2_p8: passes __p0.val[0] and __p0.val[1] (cast to int8x16_t), __p1
   * (uint8x8_t cast to int8x8_t) and the constant 4 to
   * __builtin_neon_vqtbl2_v and returns the result cast to poly8x8_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin; the name suggests a two-register table lookup indexed by __p1
   * -- confirm. */
  58664 #ifdef __LITTLE_ENDIAN__
  58665 __ai __attribute__((target("neon"))) poly8x8_t vqtbl2_p8(poly8x16x2_t __p0, uint8x8_t __p1) {
  58666   poly8x8_t __ret;
  58667   __ret = (poly8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 4);
  58668   return __ret;
  58669 }
  58670 #else
  /* Big-endian variant: reverses the 16 lanes of each __p0.val[] member and
   * the 8 lanes of __p1 before the builtin call, then reverses the 8 lanes of
   * the result. */
  58671 __ai __attribute__((target("neon"))) poly8x8_t vqtbl2_p8(poly8x16x2_t __p0, uint8x8_t __p1) {
  58672   poly8x8_t __ret;
  58673   poly8x16x2_t __rev0;
  58674   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58675   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58676   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58677   __ret = (poly8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 4);
  58678   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58679   return __ret;
  58680 }
  58681 #endif
  58682 
  /* vqtbl2q_p8: passes __p0.val[0], __p0.val[1] and __p1 (uint8x16_t), all
   * cast to int8x16_t, plus the constant 36 to __builtin_neon_vqtbl2q_v and
   * returns the result cast to poly8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin; the name suggests a two-register table lookup indexed by __p1
   * -- confirm. */
  58683 #ifdef __LITTLE_ENDIAN__
  58684 __ai __attribute__((target("neon"))) poly8x16_t vqtbl2q_p8(poly8x16x2_t __p0, uint8x16_t __p1) {
  58685   poly8x16_t __ret;
  58686   __ret = (poly8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 36);
  58687   return __ret;
  58688 }
  58689 #else
  /* Big-endian variant: reverses the 16 lanes of each __p0.val[] member and
   * of __p1 before the builtin call, then reverses the 16 lanes of the
   * result. */
  58690 __ai __attribute__((target("neon"))) poly8x16_t vqtbl2q_p8(poly8x16x2_t __p0, uint8x16_t __p1) {
  58691   poly8x16_t __ret;
  58692   poly8x16x2_t __rev0;
  58693   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58694   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58695   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58696   __ret = (poly8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 36);
  58697   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58698   return __ret;
  58699 }
  58700 #endif
  58701 
  /* vqtbl2q_u8: passes __p0.val[0], __p0.val[1] and __p1 (uint8x16_t), all
   * cast to int8x16_t, plus the constant 48 to __builtin_neon_vqtbl2q_v and
   * returns the result cast to uint8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin; the name suggests a two-register table lookup indexed by __p1
   * -- confirm. */
  58702 #ifdef __LITTLE_ENDIAN__
  58703 __ai __attribute__((target("neon"))) uint8x16_t vqtbl2q_u8(uint8x16x2_t __p0, uint8x16_t __p1) {
  58704   uint8x16_t __ret;
  58705   __ret = (uint8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 48);
  58706   return __ret;
  58707 }
  58708 #else
  /* Big-endian variant: reverses the 16 lanes of each __p0.val[] member and
   * of __p1 before the builtin call, then reverses the 16 lanes of the
   * result. */
  58709 __ai __attribute__((target("neon"))) uint8x16_t vqtbl2q_u8(uint8x16x2_t __p0, uint8x16_t __p1) {
  58710   uint8x16_t __ret;
  58711   uint8x16x2_t __rev0;
  58712   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58713   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58714   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58715   __ret = (uint8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 48);
  58716   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58717   return __ret;
  58718 }
  58719 #endif
  58720 
  /* vqtbl2q_s8: passes __p0.val[0], __p0.val[1] (int8x16_t) and __p1
   * (uint8x16_t cast to int8x16_t) plus the constant 32 to
   * __builtin_neon_vqtbl2q_v and returns the result cast to int8x16_t.
   * NOTE(review): the constant is presumably a result-type code for the
   * builtin; the name suggests a two-register table lookup indexed by __p1
   * -- confirm. */
  58721 #ifdef __LITTLE_ENDIAN__
  58722 __ai __attribute__((target("neon"))) int8x16_t vqtbl2q_s8(int8x16x2_t __p0, uint8x16_t __p1) {
  58723   int8x16_t __ret;
  58724   __ret = (int8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 32);
  58725   return __ret;
  58726 }
  58727 #else
  /* Big-endian variant: reverses the 16 lanes of each __p0.val[] member and
   * of __p1 before the builtin call, then reverses the 16 lanes of the
   * result. */
  58728 __ai __attribute__((target("neon"))) int8x16_t vqtbl2q_s8(int8x16x2_t __p0, uint8x16_t __p1) {
  58729   int8x16_t __ret;
  58730   int8x16x2_t __rev0;
  58731   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58732   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58733   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58734   __ret = (int8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 32);
  58735   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58736   return __ret;
  58737 }
  58738 #endif
  58739 
  58740 #ifdef __LITTLE_ENDIAN__
  58741 __ai __attribute__((target("neon"))) uint8x8_t vqtbl2_u8(uint8x16x2_t __p0, uint8x8_t __p1) {
  58742   uint8x8_t __ret;
  58743   __ret = (uint8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 16);
  58744   return __ret;
  58745 }
  58746 #else
  58747 __ai __attribute__((target("neon"))) uint8x8_t vqtbl2_u8(uint8x16x2_t __p0, uint8x8_t __p1) {
  58748   uint8x8_t __ret;
  58749   uint8x16x2_t __rev0;
  58750   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58751   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58752   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58753   __ret = (uint8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 16);
  58754   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58755   return __ret;
  58756 }
  58757 #endif
  58758 
  58759 #ifdef __LITTLE_ENDIAN__
  58760 __ai __attribute__((target("neon"))) int8x8_t vqtbl2_s8(int8x16x2_t __p0, uint8x8_t __p1) {
  58761   int8x8_t __ret;
  58762   __ret = (int8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 0);
  58763   return __ret;
  58764 }
  58765 #else
  58766 __ai __attribute__((target("neon"))) int8x8_t vqtbl2_s8(int8x16x2_t __p0, uint8x8_t __p1) {
  58767   int8x8_t __ret;
  58768   int8x16x2_t __rev0;
  58769   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58770   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58771   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58772   __ret = (int8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 0);
  58773   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58774   return __ret;
  58775 }
  58776 #endif
  58777 
  58778 #ifdef __LITTLE_ENDIAN__
  58779 __ai __attribute__((target("neon"))) poly8x8_t vqtbl3_p8(poly8x16x3_t __p0, uint8x8_t __p1) {
  58780   poly8x8_t __ret;
  58781   __ret = (poly8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 4);
  58782   return __ret;
  58783 }
  58784 #else
  58785 __ai __attribute__((target("neon"))) poly8x8_t vqtbl3_p8(poly8x16x3_t __p0, uint8x8_t __p1) {
  58786   poly8x8_t __ret;
  58787   poly8x16x3_t __rev0;
  58788   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58789   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58790   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58791   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58792   __ret = (poly8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 4);
  58793   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58794   return __ret;
  58795 }
  58796 #endif
  58797 
  58798 #ifdef __LITTLE_ENDIAN__
  58799 __ai __attribute__((target("neon"))) poly8x16_t vqtbl3q_p8(poly8x16x3_t __p0, uint8x16_t __p1) {
  58800   poly8x16_t __ret;
  58801   __ret = (poly8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 36);
  58802   return __ret;
  58803 }
  58804 #else
  58805 __ai __attribute__((target("neon"))) poly8x16_t vqtbl3q_p8(poly8x16x3_t __p0, uint8x16_t __p1) {
  58806   poly8x16_t __ret;
  58807   poly8x16x3_t __rev0;
  58808   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58809   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58810   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58811   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58812   __ret = (poly8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 36);
  58813   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58814   return __ret;
  58815 }
  58816 #endif
  58817 
  58818 #ifdef __LITTLE_ENDIAN__
  58819 __ai __attribute__((target("neon"))) uint8x16_t vqtbl3q_u8(uint8x16x3_t __p0, uint8x16_t __p1) {
  58820   uint8x16_t __ret;
  58821   __ret = (uint8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 48);
  58822   return __ret;
  58823 }
  58824 #else
  58825 __ai __attribute__((target("neon"))) uint8x16_t vqtbl3q_u8(uint8x16x3_t __p0, uint8x16_t __p1) {
  58826   uint8x16_t __ret;
  58827   uint8x16x3_t __rev0;
  58828   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58829   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58830   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58831   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58832   __ret = (uint8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 48);
  58833   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58834   return __ret;
  58835 }
  58836 #endif
  58837 
  58838 #ifdef __LITTLE_ENDIAN__
  58839 __ai __attribute__((target("neon"))) int8x16_t vqtbl3q_s8(int8x16x3_t __p0, uint8x16_t __p1) {
  58840   int8x16_t __ret;
  58841   __ret = (int8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 32);
  58842   return __ret;
  58843 }
  58844 #else
  58845 __ai __attribute__((target("neon"))) int8x16_t vqtbl3q_s8(int8x16x3_t __p0, uint8x16_t __p1) {
  58846   int8x16_t __ret;
  58847   int8x16x3_t __rev0;
  58848   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58849   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58850   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58851   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58852   __ret = (int8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 32);
  58853   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58854   return __ret;
  58855 }
  58856 #endif
  58857 
  58858 #ifdef __LITTLE_ENDIAN__
  58859 __ai __attribute__((target("neon"))) uint8x8_t vqtbl3_u8(uint8x16x3_t __p0, uint8x8_t __p1) {
  58860   uint8x8_t __ret;
  58861   __ret = (uint8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 16);
  58862   return __ret;
  58863 }
  58864 #else
  58865 __ai __attribute__((target("neon"))) uint8x8_t vqtbl3_u8(uint8x16x3_t __p0, uint8x8_t __p1) {
  58866   uint8x8_t __ret;
  58867   uint8x16x3_t __rev0;
  58868   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58869   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58870   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58871   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58872   __ret = (uint8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 16);
  58873   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58874   return __ret;
  58875 }
  58876 #endif
  58877 
  58878 #ifdef __LITTLE_ENDIAN__
  58879 __ai __attribute__((target("neon"))) int8x8_t vqtbl3_s8(int8x16x3_t __p0, uint8x8_t __p1) {
  58880   int8x8_t __ret;
  58881   __ret = (int8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 0);
  58882   return __ret;
  58883 }
  58884 #else
  58885 __ai __attribute__((target("neon"))) int8x8_t vqtbl3_s8(int8x16x3_t __p0, uint8x8_t __p1) {
  58886   int8x8_t __ret;
  58887   int8x16x3_t __rev0;
  58888   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58889   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58890   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58891   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58892   __ret = (int8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 0);
  58893   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58894   return __ret;
  58895 }
  58896 #endif
  58897 
  58898 #ifdef __LITTLE_ENDIAN__
  58899 __ai __attribute__((target("neon"))) poly8x8_t vqtbl4_p8(poly8x16x4_t __p0, uint8x8_t __p1) {
  58900   poly8x8_t __ret;
  58901   __ret = (poly8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 4);
  58902   return __ret;
  58903 }
  58904 #else
  58905 __ai __attribute__((target("neon"))) poly8x8_t vqtbl4_p8(poly8x16x4_t __p0, uint8x8_t __p1) {
  58906   poly8x8_t __ret;
  58907   poly8x16x4_t __rev0;
  58908   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58909   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58910   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58911   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58912   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58913   __ret = (poly8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 4);
  58914   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58915   return __ret;
  58916 }
  58917 #endif
  58918 
  58919 #ifdef __LITTLE_ENDIAN__
  58920 __ai __attribute__((target("neon"))) poly8x16_t vqtbl4q_p8(poly8x16x4_t __p0, uint8x16_t __p1) {
  58921   poly8x16_t __ret;
  58922   __ret = (poly8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 36);
  58923   return __ret;
  58924 }
  58925 #else
  58926 __ai __attribute__((target("neon"))) poly8x16_t vqtbl4q_p8(poly8x16x4_t __p0, uint8x16_t __p1) {
  58927   poly8x16_t __ret;
  58928   poly8x16x4_t __rev0;
  58929   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58930   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58931   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58932   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58933   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58934   __ret = (poly8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 36);
  58935   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58936   return __ret;
  58937 }
  58938 #endif
  58939 
  58940 #ifdef __LITTLE_ENDIAN__
  58941 __ai __attribute__((target("neon"))) uint8x16_t vqtbl4q_u8(uint8x16x4_t __p0, uint8x16_t __p1) {
  58942   uint8x16_t __ret;
  58943   __ret = (uint8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 48);
  58944   return __ret;
  58945 }
  58946 #else
  58947 __ai __attribute__((target("neon"))) uint8x16_t vqtbl4q_u8(uint8x16x4_t __p0, uint8x16_t __p1) {
  58948   uint8x16_t __ret;
  58949   uint8x16x4_t __rev0;
  58950   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58951   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58952   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58953   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58954   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58955   __ret = (uint8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 48);
  58956   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58957   return __ret;
  58958 }
  58959 #endif
  58960 
  58961 #ifdef __LITTLE_ENDIAN__
  58962 __ai __attribute__((target("neon"))) int8x16_t vqtbl4q_s8(int8x16x4_t __p0, uint8x16_t __p1) {
  58963   int8x16_t __ret;
  58964   __ret = (int8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 32);
  58965   return __ret;
  58966 }
  58967 #else
  58968 __ai __attribute__((target("neon"))) int8x16_t vqtbl4q_s8(int8x16x4_t __p0, uint8x16_t __p1) {
  58969   int8x16_t __ret;
  58970   int8x16x4_t __rev0;
  58971   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58972   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58973   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58974   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58975   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58976   __ret = (int8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 32);
  58977   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58978   return __ret;
  58979 }
  58980 #endif
  58981 
  58982 #ifdef __LITTLE_ENDIAN__
  58983 __ai __attribute__((target("neon"))) uint8x8_t vqtbl4_u8(uint8x16x4_t __p0, uint8x8_t __p1) {
  58984   uint8x8_t __ret;
  58985   __ret = (uint8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 16);
  58986   return __ret;
  58987 }
  58988 #else
  58989 __ai __attribute__((target("neon"))) uint8x8_t vqtbl4_u8(uint8x16x4_t __p0, uint8x8_t __p1) {
  58990   uint8x8_t __ret;
  58991   uint8x16x4_t __rev0;
  58992   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58993   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58994   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58995   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  58996   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  58997   __ret = (uint8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 16);
  58998   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  58999   return __ret;
  59000 }
  59001 #endif
  59002 
  59003 #ifdef __LITTLE_ENDIAN__
  59004 __ai __attribute__((target("neon"))) int8x8_t vqtbl4_s8(int8x16x4_t __p0, uint8x8_t __p1) {
  59005   int8x8_t __ret;
  59006   __ret = (int8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 0);
  59007   return __ret;
  59008 }
  59009 #else
  59010 __ai __attribute__((target("neon"))) int8x8_t vqtbl4_s8(int8x16x4_t __p0, uint8x8_t __p1) {
  59011   int8x8_t __ret;
  59012   int8x16x4_t __rev0;
  59013   __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59014   __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59015   __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59016   __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59017   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  59018   __ret = (int8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 0);
  59019   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59020   return __ret;
  59021 }
  59022 #endif
  59023 
  59024 #ifdef __LITTLE_ENDIAN__
  59025 __ai __attribute__((target("neon"))) poly8x8_t vqtbx1_p8(poly8x8_t __p0, poly8x16_t __p1, uint8x8_t __p2) {
  59026   poly8x8_t __ret;
  59027   __ret = (poly8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 4);
  59028   return __ret;
  59029 }
  59030 #else
  59031 __ai __attribute__((target("neon"))) poly8x8_t vqtbx1_p8(poly8x8_t __p0, poly8x16_t __p1, uint8x8_t __p2) {
  59032   poly8x8_t __ret;
  59033   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59034   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59035   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59036   __ret = (poly8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 4);
  59037   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59038   return __ret;
  59039 }
  59040 #endif
  59041 
  59042 #ifdef __LITTLE_ENDIAN__
  59043 __ai __attribute__((target("neon"))) poly8x16_t vqtbx1q_p8(poly8x16_t __p0, poly8x16_t __p1, uint8x16_t __p2) {
  59044   poly8x16_t __ret;
  59045   __ret = (poly8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 36);
  59046   return __ret;
  59047 }
  59048 #else
  59049 __ai __attribute__((target("neon"))) poly8x16_t vqtbx1q_p8(poly8x16_t __p0, poly8x16_t __p1, uint8x16_t __p2) {
  59050   poly8x16_t __ret;
  59051   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59052   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59053   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59054   __ret = (poly8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 36);
  59055   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59056   return __ret;
  59057 }
  59058 #endif
  59059 
  59060 #ifdef __LITTLE_ENDIAN__
  59061 __ai __attribute__((target("neon"))) uint8x16_t vqtbx1q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  59062   uint8x16_t __ret;
  59063   __ret = (uint8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48);
  59064   return __ret;
  59065 }
  59066 #else
  59067 __ai __attribute__((target("neon"))) uint8x16_t vqtbx1q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  59068   uint8x16_t __ret;
  59069   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59070   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59071   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59072   __ret = (uint8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48);
  59073   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59074   return __ret;
  59075 }
  59076 #endif
  59077 
  59078 #ifdef __LITTLE_ENDIAN__
  59079 __ai __attribute__((target("neon"))) int8x16_t vqtbx1q_s8(int8x16_t __p0, int8x16_t __p1, uint8x16_t __p2) {
  59080   int8x16_t __ret;
  59081   __ret = (int8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32);
  59082   return __ret;
  59083 }
  59084 #else
  59085 __ai __attribute__((target("neon"))) int8x16_t vqtbx1q_s8(int8x16_t __p0, int8x16_t __p1, uint8x16_t __p2) {
  59086   int8x16_t __ret;
  59087   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59088   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59089   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59090   __ret = (int8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32);
  59091   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59092   return __ret;
  59093 }
  59094 #endif
  59095 
  59096 #ifdef __LITTLE_ENDIAN__
  59097 __ai __attribute__((target("neon"))) uint8x8_t vqtbx1_u8(uint8x8_t __p0, uint8x16_t __p1, uint8x8_t __p2) {
  59098   uint8x8_t __ret;
  59099   __ret = (uint8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 16);
  59100   return __ret;
  59101 }
  59102 #else
  59103 __ai __attribute__((target("neon"))) uint8x8_t vqtbx1_u8(uint8x8_t __p0, uint8x16_t __p1, uint8x8_t __p2) {
  59104   uint8x8_t __ret;
  59105   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59106   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59107   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59108   __ret = (uint8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 16);
  59109   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59110   return __ret;
  59111 }
  59112 #endif
  59113 
  59114 #ifdef __LITTLE_ENDIAN__
  59115 __ai __attribute__((target("neon"))) int8x8_t vqtbx1_s8(int8x8_t __p0, int8x16_t __p1, uint8x8_t __p2) {
  59116   int8x8_t __ret;
  59117   __ret = (int8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 0);
  59118   return __ret;
  59119 }
  59120 #else
  59121 __ai __attribute__((target("neon"))) int8x8_t vqtbx1_s8(int8x8_t __p0, int8x16_t __p1, uint8x8_t __p2) {
  59122   int8x8_t __ret;
  59123   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59124   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59125   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59126   __ret = (int8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 0);
  59127   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59128   return __ret;
  59129 }
  59130 #endif
  59131 
  59132 #ifdef __LITTLE_ENDIAN__
  59133 __ai __attribute__((target("neon"))) poly8x8_t vqtbx2_p8(poly8x8_t __p0, poly8x16x2_t __p1, uint8x8_t __p2) {
  59134   poly8x8_t __ret;
  59135   __ret = (poly8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 4);
  59136   return __ret;
  59137 }
  59138 #else
  59139 __ai __attribute__((target("neon"))) poly8x8_t vqtbx2_p8(poly8x8_t __p0, poly8x16x2_t __p1, uint8x8_t __p2) {
  59140   poly8x8_t __ret;
  59141   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59142   poly8x16x2_t __rev1;
  59143   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59144   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59145   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59146   __ret = (poly8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 4);
  59147   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59148   return __ret;
  59149 }
  59150 #endif
  59151 
  59152 #ifdef __LITTLE_ENDIAN__
  59153 __ai __attribute__((target("neon"))) poly8x16_t vqtbx2q_p8(poly8x16_t __p0, poly8x16x2_t __p1, uint8x16_t __p2) {
  59154   poly8x16_t __ret;
  59155   __ret = (poly8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 36);
  59156   return __ret;
  59157 }
  59158 #else
  59159 __ai __attribute__((target("neon"))) poly8x16_t vqtbx2q_p8(poly8x16_t __p0, poly8x16x2_t __p1, uint8x16_t __p2) {
  59160   poly8x16_t __ret;
  59161   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59162   poly8x16x2_t __rev1;
  59163   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59164   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59165   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59166   __ret = (poly8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 36);
  59167   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59168   return __ret;
  59169 }
  59170 #endif
  59171 
  59172 #ifdef __LITTLE_ENDIAN__
  59173 __ai __attribute__((target("neon"))) uint8x16_t vqtbx2q_u8(uint8x16_t __p0, uint8x16x2_t __p1, uint8x16_t __p2) {
  59174   uint8x16_t __ret;
  59175   __ret = (uint8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 48);
  59176   return __ret;
  59177 }
  59178 #else
  59179 __ai __attribute__((target("neon"))) uint8x16_t vqtbx2q_u8(uint8x16_t __p0, uint8x16x2_t __p1, uint8x16_t __p2) {
  59180   uint8x16_t __ret;
  59181   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59182   uint8x16x2_t __rev1;
  59183   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59184   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59185   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59186   __ret = (uint8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 48);
  59187   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59188   return __ret;
  59189 }
  59190 #endif
  59191 
  59192 #ifdef __LITTLE_ENDIAN__
  59193 __ai __attribute__((target("neon"))) int8x16_t vqtbx2q_s8(int8x16_t __p0, int8x16x2_t __p1, uint8x16_t __p2) {
  59194   int8x16_t __ret;
  59195   __ret = (int8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 32);
  59196   return __ret;
  59197 }
  59198 #else
  59199 __ai __attribute__((target("neon"))) int8x16_t vqtbx2q_s8(int8x16_t __p0, int8x16x2_t __p1, uint8x16_t __p2) {
  59200   int8x16_t __ret;
  59201   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59202   int8x16x2_t __rev1;
  59203   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59204   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59205   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59206   __ret = (int8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 32);
  59207   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59208   return __ret;
  59209 }
  59210 #endif
  59211 
  59212 #ifdef __LITTLE_ENDIAN__
  59213 __ai __attribute__((target("neon"))) uint8x8_t vqtbx2_u8(uint8x8_t __p0, uint8x16x2_t __p1, uint8x8_t __p2) {
  59214   uint8x8_t __ret;
  59215   __ret = (uint8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 16);
  59216   return __ret;
  59217 }
  59218 #else
  59219 __ai __attribute__((target("neon"))) uint8x8_t vqtbx2_u8(uint8x8_t __p0, uint8x16x2_t __p1, uint8x8_t __p2) {
  59220   uint8x8_t __ret;
  59221   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59222   uint8x16x2_t __rev1;
  59223   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59224   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59225   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59226   __ret = (uint8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 16);
  59227   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59228   return __ret;
  59229 }
  59230 #endif
  59231 
  59232 #ifdef __LITTLE_ENDIAN__
  59233 __ai __attribute__((target("neon"))) int8x8_t vqtbx2_s8(int8x8_t __p0, int8x16x2_t __p1, uint8x8_t __p2) {
  59234   int8x8_t __ret;
  59235   __ret = (int8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 0);
  59236   return __ret;
  59237 }
  59238 #else
  59239 __ai __attribute__((target("neon"))) int8x8_t vqtbx2_s8(int8x8_t __p0, int8x16x2_t __p1, uint8x8_t __p2) {
  59240   int8x8_t __ret;
  59241   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59242   int8x16x2_t __rev1;
  59243   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59244   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59245   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59246   __ret = (int8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 0);
  59247   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59248   return __ret;
  59249 }
  59250 #endif
  59251 
  59252 #ifdef __LITTLE_ENDIAN__
  59253 __ai __attribute__((target("neon"))) poly8x8_t vqtbx3_p8(poly8x8_t __p0, poly8x16x3_t __p1, uint8x8_t __p2) {
  59254   poly8x8_t __ret;
  59255   __ret = (poly8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 4);
  59256   return __ret;
  59257 }
  59258 #else
  59259 __ai __attribute__((target("neon"))) poly8x8_t vqtbx3_p8(poly8x8_t __p0, poly8x16x3_t __p1, uint8x8_t __p2) {
  59260   poly8x8_t __ret;
  59261   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59262   poly8x16x3_t __rev1;
  59263   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59264   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59265   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59266   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59267   __ret = (poly8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 4);
  59268   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59269   return __ret;
  59270 }
  59271 #endif
  59272 
  59273 #ifdef __LITTLE_ENDIAN__
  59274 __ai __attribute__((target("neon"))) poly8x16_t vqtbx3q_p8(poly8x16_t __p0, poly8x16x3_t __p1, uint8x16_t __p2) {
  59275   poly8x16_t __ret;
  59276   __ret = (poly8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 36);
  59277   return __ret;
  59278 }
  59279 #else
  59280 __ai __attribute__((target("neon"))) poly8x16_t vqtbx3q_p8(poly8x16_t __p0, poly8x16x3_t __p1, uint8x16_t __p2) {
  59281   poly8x16_t __ret;
  59282   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59283   poly8x16x3_t __rev1;
  59284   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59285   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59286   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59287   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59288   __ret = (poly8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 36);
  59289   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59290   return __ret;
  59291 }
  59292 #endif
  59293 
  59294 #ifdef __LITTLE_ENDIAN__
  59295 __ai __attribute__((target("neon"))) uint8x16_t vqtbx3q_u8(uint8x16_t __p0, uint8x16x3_t __p1, uint8x16_t __p2) {
  59296   uint8x16_t __ret;
  59297   __ret = (uint8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 48);
  59298   return __ret;
  59299 }
  59300 #else
  59301 __ai __attribute__((target("neon"))) uint8x16_t vqtbx3q_u8(uint8x16_t __p0, uint8x16x3_t __p1, uint8x16_t __p2) {
  59302   uint8x16_t __ret;
  59303   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59304   uint8x16x3_t __rev1;
  59305   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59306   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59307   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59308   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59309   __ret = (uint8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 48);
  59310   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59311   return __ret;
  59312 }
  59313 #endif
  59314 
  59315 #ifdef __LITTLE_ENDIAN__
  59316 __ai __attribute__((target("neon"))) int8x16_t vqtbx3q_s8(int8x16_t __p0, int8x16x3_t __p1, uint8x16_t __p2) {
  59317   int8x16_t __ret;
  59318   __ret = (int8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 32);
  59319   return __ret;
  59320 }
  59321 #else
  59322 __ai __attribute__((target("neon"))) int8x16_t vqtbx3q_s8(int8x16_t __p0, int8x16x3_t __p1, uint8x16_t __p2) {
  59323   int8x16_t __ret;
  59324   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59325   int8x16x3_t __rev1;
  59326   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59327   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59328   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59329   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59330   __ret = (int8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 32);
  59331   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59332   return __ret;
  59333 }
  59334 #endif
  59335 
  59336 #ifdef __LITTLE_ENDIAN__
  59337 __ai __attribute__((target("neon"))) uint8x8_t vqtbx3_u8(uint8x8_t __p0, uint8x16x3_t __p1, uint8x8_t __p2) {
  59338   uint8x8_t __ret;
  59339   __ret = (uint8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 16);
  59340   return __ret;
  59341 }
  59342 #else
  59343 __ai __attribute__((target("neon"))) uint8x8_t vqtbx3_u8(uint8x8_t __p0, uint8x16x3_t __p1, uint8x8_t __p2) {
  59344   uint8x8_t __ret;
  59345   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59346   uint8x16x3_t __rev1;
  59347   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59348   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59349   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59350   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59351   __ret = (uint8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 16);
  59352   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59353   return __ret;
  59354 }
  59355 #endif
  59356 
  59357 #ifdef __LITTLE_ENDIAN__
  59358 __ai __attribute__((target("neon"))) int8x8_t vqtbx3_s8(int8x8_t __p0, int8x16x3_t __p1, uint8x8_t __p2) {
  59359   int8x8_t __ret;
  59360   __ret = (int8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 0);
  59361   return __ret;
  59362 }
  59363 #else
  59364 __ai __attribute__((target("neon"))) int8x8_t vqtbx3_s8(int8x8_t __p0, int8x16x3_t __p1, uint8x8_t __p2) {
  59365   int8x8_t __ret;
  59366   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59367   int8x16x3_t __rev1;
  59368   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59369   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59370   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59371   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59372   __ret = (int8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 0);
  59373   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59374   return __ret;
  59375 }
  59376 #endif
  59377 
  59378 #ifdef __LITTLE_ENDIAN__
  59379 __ai __attribute__((target("neon"))) poly8x8_t vqtbx4_p8(poly8x8_t __p0, poly8x16x4_t __p1, uint8x8_t __p2) {
  59380   poly8x8_t __ret;
  59381   __ret = (poly8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 4);
  59382   return __ret;
  59383 }
  59384 #else
  59385 __ai __attribute__((target("neon"))) poly8x8_t vqtbx4_p8(poly8x8_t __p0, poly8x16x4_t __p1, uint8x8_t __p2) {
  59386   poly8x8_t __ret;
  59387   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59388   poly8x16x4_t __rev1;
  59389   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59390   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59391   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59392   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59393   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59394   __ret = (poly8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 4);
  59395   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59396   return __ret;
  59397 }
  59398 #endif
  59399 
  59400 #ifdef __LITTLE_ENDIAN__
  59401 __ai __attribute__((target("neon"))) poly8x16_t vqtbx4q_p8(poly8x16_t __p0, poly8x16x4_t __p1, uint8x16_t __p2) {
  59402   poly8x16_t __ret;
  59403   __ret = (poly8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 36);
  59404   return __ret;
  59405 }
  59406 #else
  59407 __ai __attribute__((target("neon"))) poly8x16_t vqtbx4q_p8(poly8x16_t __p0, poly8x16x4_t __p1, uint8x16_t __p2) {
  59408   poly8x16_t __ret;
  59409   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59410   poly8x16x4_t __rev1;
  59411   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59412   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59413   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59414   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59415   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59416   __ret = (poly8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 36);
  59417   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59418   return __ret;
  59419 }
  59420 #endif
  59421 
  59422 #ifdef __LITTLE_ENDIAN__
  59423 __ai __attribute__((target("neon"))) uint8x16_t vqtbx4q_u8(uint8x16_t __p0, uint8x16x4_t __p1, uint8x16_t __p2) {
  59424   uint8x16_t __ret;
  59425   __ret = (uint8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 48);
  59426   return __ret;
  59427 }
  59428 #else
  59429 __ai __attribute__((target("neon"))) uint8x16_t vqtbx4q_u8(uint8x16_t __p0, uint8x16x4_t __p1, uint8x16_t __p2) {
  59430   uint8x16_t __ret;
  59431   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59432   uint8x16x4_t __rev1;
  59433   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59434   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59435   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59436   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59437   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59438   __ret = (uint8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 48);
  59439   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59440   return __ret;
  59441 }
  59442 #endif
  59443 
  59444 #ifdef __LITTLE_ENDIAN__
  59445 __ai __attribute__((target("neon"))) int8x16_t vqtbx4q_s8(int8x16_t __p0, int8x16x4_t __p1, uint8x16_t __p2) {
  59446   int8x16_t __ret;
  59447   __ret = (int8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 32);
  59448   return __ret;
  59449 }
  59450 #else
  59451 __ai __attribute__((target("neon"))) int8x16_t vqtbx4q_s8(int8x16_t __p0, int8x16x4_t __p1, uint8x16_t __p2) {
  59452   int8x16_t __ret;
  59453   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59454   int8x16x4_t __rev1;
  59455   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59456   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59457   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59458   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59459   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59460   __ret = (int8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 32);
  59461   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59462   return __ret;
  59463 }
  59464 #endif
  59465 
  59466 #ifdef __LITTLE_ENDIAN__
  59467 __ai __attribute__((target("neon"))) uint8x8_t vqtbx4_u8(uint8x8_t __p0, uint8x16x4_t __p1, uint8x8_t __p2) {
  59468   uint8x8_t __ret;
  59469   __ret = (uint8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 16);
  59470   return __ret;
  59471 }
  59472 #else
  59473 __ai __attribute__((target("neon"))) uint8x8_t vqtbx4_u8(uint8x8_t __p0, uint8x16x4_t __p1, uint8x8_t __p2) {
  59474   uint8x8_t __ret;
  59475   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59476   uint8x16x4_t __rev1;
  59477   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59478   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59479   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59480   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59481   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59482   __ret = (uint8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 16);
  59483   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59484   return __ret;
  59485 }
  59486 #endif
  59487 
  59488 #ifdef __LITTLE_ENDIAN__
  59489 __ai __attribute__((target("neon"))) int8x8_t vqtbx4_s8(int8x8_t __p0, int8x16x4_t __p1, uint8x8_t __p2) {
  59490   int8x8_t __ret;
  59491   __ret = (int8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 0);
  59492   return __ret;
  59493 }
  59494 #else
  59495 __ai __attribute__((target("neon"))) int8x8_t vqtbx4_s8(int8x8_t __p0, int8x16x4_t __p1, uint8x8_t __p2) {
  59496   int8x8_t __ret;
  59497   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59498   int8x16x4_t __rev1;
  59499   __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59500   __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59501   __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59502   __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59503   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59504   __ret = (int8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 0);
  59505   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59506   return __ret;
  59507 }
  59508 #endif
  59509 
  59510 #ifdef __LITTLE_ENDIAN__
  59511 __ai __attribute__((target("neon"))) uint16x8_t vraddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  59512   uint16x8_t __ret;
  59513   __ret = vcombine_u16(__p0, vraddhn_u32(__p1, __p2));
  59514   return __ret;
  59515 }
  59516 #else
  59517 __ai __attribute__((target("neon"))) uint16x8_t vraddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  59518   uint16x8_t __ret;
  59519   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  59520   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  59521   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  59522   __ret = __noswap_vcombine_u16(__rev0, __noswap_vraddhn_u32(__rev1, __rev2));
  59523   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59524   return __ret;
  59525 }
  59526 #endif
  59527 
  59528 #ifdef __LITTLE_ENDIAN__
  59529 __ai __attribute__((target("neon"))) uint32x4_t vraddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  59530   uint32x4_t __ret;
  59531   __ret = vcombine_u32(__p0, vraddhn_u64(__p1, __p2));
  59532   return __ret;
  59533 }
  59534 #else
  59535 __ai __attribute__((target("neon"))) uint32x4_t vraddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  59536   uint32x4_t __ret;
  59537   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  59538   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  59539   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  59540   __ret = __noswap_vcombine_u32(__rev0, __noswap_vraddhn_u64(__rev1, __rev2));
  59541   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  59542   return __ret;
  59543 }
  59544 #endif
  59545 
  59546 #ifdef __LITTLE_ENDIAN__
  59547 __ai __attribute__((target("neon"))) uint8x16_t vraddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  59548   uint8x16_t __ret;
  59549   __ret = vcombine_u8(__p0, vraddhn_u16(__p1, __p2));
  59550   return __ret;
  59551 }
  59552 #else
  59553 __ai __attribute__((target("neon"))) uint8x16_t vraddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  59554   uint8x16_t __ret;
  59555   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59556   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  59557   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59558   __ret = __noswap_vcombine_u8(__rev0, __noswap_vraddhn_u16(__rev1, __rev2));
  59559   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59560   return __ret;
  59561 }
  59562 #endif
  59563 
  59564 #ifdef __LITTLE_ENDIAN__
  59565 __ai __attribute__((target("neon"))) int16x8_t vraddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  59566   int16x8_t __ret;
  59567   __ret = vcombine_s16(__p0, vraddhn_s32(__p1, __p2));
  59568   return __ret;
  59569 }
  59570 #else
  59571 __ai __attribute__((target("neon"))) int16x8_t vraddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  59572   int16x8_t __ret;
  59573   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  59574   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  59575   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  59576   __ret = __noswap_vcombine_s16(__rev0, __noswap_vraddhn_s32(__rev1, __rev2));
  59577   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59578   return __ret;
  59579 }
  59580 #endif
  59581 
  59582 #ifdef __LITTLE_ENDIAN__
  59583 __ai __attribute__((target("neon"))) int32x4_t vraddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  59584   int32x4_t __ret;
  59585   __ret = vcombine_s32(__p0, vraddhn_s64(__p1, __p2));
  59586   return __ret;
  59587 }
  59588 #else
  59589 __ai __attribute__((target("neon"))) int32x4_t vraddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  59590   int32x4_t __ret;
  59591   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  59592   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  59593   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  59594   __ret = __noswap_vcombine_s32(__rev0, __noswap_vraddhn_s64(__rev1, __rev2));
  59595   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  59596   return __ret;
  59597 }
  59598 #endif
  59599 
  59600 #ifdef __LITTLE_ENDIAN__
  59601 __ai __attribute__((target("neon"))) int8x16_t vraddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  59602   int8x16_t __ret;
  59603   __ret = vcombine_s8(__p0, vraddhn_s16(__p1, __p2));
  59604   return __ret;
  59605 }
  59606 #else
  59607 __ai __attribute__((target("neon"))) int8x16_t vraddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  59608   int8x16_t __ret;
  59609   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59610   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  59611   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  59612   __ret = __noswap_vcombine_s8(__rev0, __noswap_vraddhn_s16(__rev1, __rev2));
  59613   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59614   return __ret;
  59615 }
  59616 #endif
  59617 
  59618 #ifdef __LITTLE_ENDIAN__
  59619 __ai __attribute__((target("neon"))) poly8x8_t vrbit_p8(poly8x8_t __p0) {
  59620   poly8x8_t __ret;
  59621   __ret = (poly8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 4);
  59622   return __ret;
  59623 }
  59624 #else
  59625 __ai __attribute__((target("neon"))) poly8x8_t vrbit_p8(poly8x8_t __p0) {
  59626   poly8x8_t __ret;
  59627   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59628   __ret = (poly8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 4);
  59629   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59630   return __ret;
  59631 }
  59632 #endif
  59633 
  59634 #ifdef __LITTLE_ENDIAN__
  59635 __ai __attribute__((target("neon"))) poly8x16_t vrbitq_p8(poly8x16_t __p0) {
  59636   poly8x16_t __ret;
  59637   __ret = (poly8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 36);
  59638   return __ret;
  59639 }
  59640 #else
  59641 __ai __attribute__((target("neon"))) poly8x16_t vrbitq_p8(poly8x16_t __p0) {
  59642   poly8x16_t __ret;
  59643   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59644   __ret = (poly8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 36);
  59645   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59646   return __ret;
  59647 }
  59648 #endif
  59649 
  59650 #ifdef __LITTLE_ENDIAN__
  59651 __ai __attribute__((target("neon"))) uint8x16_t vrbitq_u8(uint8x16_t __p0) {
  59652   uint8x16_t __ret;
  59653   __ret = (uint8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 48);
  59654   return __ret;
  59655 }
  59656 #else
  59657 __ai __attribute__((target("neon"))) uint8x16_t vrbitq_u8(uint8x16_t __p0) {
  59658   uint8x16_t __ret;
  59659   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59660   __ret = (uint8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 48);
  59661   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59662   return __ret;
  59663 }
  59664 #endif
  59665 
  59666 #ifdef __LITTLE_ENDIAN__
  59667 __ai __attribute__((target("neon"))) int8x16_t vrbitq_s8(int8x16_t __p0) {
  59668   int8x16_t __ret;
  59669   __ret = (int8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 32);
  59670   return __ret;
  59671 }
  59672 #else
  59673 __ai __attribute__((target("neon"))) int8x16_t vrbitq_s8(int8x16_t __p0) {
  59674   int8x16_t __ret;
  59675   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59676   __ret = (int8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 32);
  59677   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  59678   return __ret;
  59679 }
  59680 #endif
  59681 
  59682 #ifdef __LITTLE_ENDIAN__
  59683 __ai __attribute__((target("neon"))) uint8x8_t vrbit_u8(uint8x8_t __p0) {
  59684   uint8x8_t __ret;
  59685   __ret = (uint8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 16);
  59686   return __ret;
  59687 }
  59688 #else
  59689 __ai __attribute__((target("neon"))) uint8x8_t vrbit_u8(uint8x8_t __p0) {
  59690   uint8x8_t __ret;
  59691   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59692   __ret = (uint8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 16);
  59693   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59694   return __ret;
  59695 }
  59696 #endif
  59697 
  59698 #ifdef __LITTLE_ENDIAN__
  59699 __ai __attribute__((target("neon"))) int8x8_t vrbit_s8(int8x8_t __p0) {
  59700   int8x8_t __ret;
  59701   __ret = (int8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 0);
  59702   return __ret;
  59703 }
  59704 #else
  59705 __ai __attribute__((target("neon"))) int8x8_t vrbit_s8(int8x8_t __p0) {
  59706   int8x8_t __ret;
  59707   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  59708   __ret = (int8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 0);
  59709   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  59710   return __ret;
  59711 }
  59712 #endif
  59713 
  59714 #ifdef __LITTLE_ENDIAN__
  59715 __ai __attribute__((target("neon"))) float64x2_t vrecpeq_f64(float64x2_t __p0) {
  59716   float64x2_t __ret;
  59717   __ret = (float64x2_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 42);
  59718   return __ret;
  59719 }
  59720 #else
  59721 __ai __attribute__((target("neon"))) float64x2_t vrecpeq_f64(float64x2_t __p0) {
  59722   float64x2_t __ret;
  59723   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  59724   __ret = (float64x2_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 42);
  59725   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  59726   return __ret;
  59727 }
  59728 #endif
  59729 
  59730 __ai __attribute__((target("neon"))) float64x1_t vrecpe_f64(float64x1_t __p0) {
  59731   float64x1_t __ret;
  59732   __ret = (float64x1_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 10);
  59733   return __ret;
  59734 }
  59735 __ai __attribute__((target("neon"))) float64_t vrecped_f64(float64_t __p0) {
  59736   float64_t __ret;
  59737   __ret = (float64_t) __builtin_neon_vrecped_f64(__p0);
  59738   return __ret;
  59739 }
  59740 __ai __attribute__((target("neon"))) float32_t vrecpes_f32(float32_t __p0) {
  59741   float32_t __ret;
  59742   __ret = (float32_t) __builtin_neon_vrecpes_f32(__p0);
  59743   return __ret;
  59744 }
  59745 #ifdef __LITTLE_ENDIAN__
  59746 __ai __attribute__((target("neon"))) float64x2_t vrecpsq_f64(float64x2_t __p0, float64x2_t __p1) {
  59747   float64x2_t __ret;
  59748   __ret = (float64x2_t) __builtin_neon_vrecpsq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  59749   return __ret;
  59750 }
  59751 #else
  59752 __ai __attribute__((target("neon"))) float64x2_t vrecpsq_f64(float64x2_t __p0, float64x2_t __p1) {
  59753   float64x2_t __ret;
  59754   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  59755   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  59756   __ret = (float64x2_t) __builtin_neon_vrecpsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  59757   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  59758   return __ret;
  59759 }
  59760 #endif
  59761 
  59762 __ai __attribute__((target("neon"))) float64x1_t vrecps_f64(float64x1_t __p0, float64x1_t __p1) {
  59763   float64x1_t __ret;
  59764   __ret = (float64x1_t) __builtin_neon_vrecps_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  59765   return __ret;
  59766 }
  59767 __ai __attribute__((target("neon"))) float64_t vrecpsd_f64(float64_t __p0, float64_t __p1) {
  59768   float64_t __ret;
  59769   __ret = (float64_t) __builtin_neon_vrecpsd_f64(__p0, __p1);
  59770   return __ret;
  59771 }
  59772 __ai __attribute__((target("neon"))) float32_t vrecpss_f32(float32_t __p0, float32_t __p1) {
  59773   float32_t __ret;
  59774   __ret = (float32_t) __builtin_neon_vrecpss_f32(__p0, __p1);
  59775   return __ret;
  59776 }
  59777 __ai __attribute__((target("neon"))) float64_t vrecpxd_f64(float64_t __p0) {
  59778   float64_t __ret;
  59779   __ret = (float64_t) __builtin_neon_vrecpxd_f64(__p0);
  59780   return __ret;
  59781 }
  59782 __ai __attribute__((target("neon"))) float32_t vrecpxs_f32(float32_t __p0) {
  59783   float32_t __ret;
  59784   __ret = (float32_t) __builtin_neon_vrecpxs_f32(__p0);
  59785   return __ret;
  59786 }
  59787 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p64(poly64x1_t __p0) {
  59788   poly8x8_t __ret;
  59789   __ret = (poly8x8_t)(__p0);
  59790   return __ret;
  59791 }
  59792 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p16(poly16x4_t __p0) {
  59793   poly8x8_t __ret;
  59794   __ret = (poly8x8_t)(__p0);
  59795   return __ret;
  59796 }
  59797 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u8(uint8x8_t __p0) {
  59798   poly8x8_t __ret;
  59799   __ret = (poly8x8_t)(__p0);
  59800   return __ret;
  59801 }
  59802 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u32(uint32x2_t __p0) {
  59803   poly8x8_t __ret;
  59804   __ret = (poly8x8_t)(__p0);
  59805   return __ret;
  59806 }
  59807 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u64(uint64x1_t __p0) {
  59808   poly8x8_t __ret;
  59809   __ret = (poly8x8_t)(__p0);
  59810   return __ret;
  59811 }
  59812 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u16(uint16x4_t __p0) {
  59813   poly8x8_t __ret;
  59814   __ret = (poly8x8_t)(__p0);
  59815   return __ret;
  59816 }
  59817 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s8(int8x8_t __p0) {
  59818   poly8x8_t __ret;
  59819   __ret = (poly8x8_t)(__p0);
  59820   return __ret;
  59821 }
  59822 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f64(float64x1_t __p0) {
  59823   poly8x8_t __ret;
  59824   __ret = (poly8x8_t)(__p0);
  59825   return __ret;
  59826 }
  59827 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f32(float32x2_t __p0) {
  59828   poly8x8_t __ret;
  59829   __ret = (poly8x8_t)(__p0);
  59830   return __ret;
  59831 }
  59832 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f16(float16x4_t __p0) {
  59833   poly8x8_t __ret;
  59834   __ret = (poly8x8_t)(__p0);
  59835   return __ret;
  59836 }
  59837 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s32(int32x2_t __p0) {
  59838   poly8x8_t __ret;
  59839   __ret = (poly8x8_t)(__p0);
  59840   return __ret;
  59841 }
  59842 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s64(int64x1_t __p0) {
  59843   poly8x8_t __ret;
  59844   __ret = (poly8x8_t)(__p0);
  59845   return __ret;
  59846 }
  59847 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_mf8(mfloat8x8_t __p0) {
  59848   poly8x8_t __ret;
  59849   __ret = (poly8x8_t)(__p0);
  59850   return __ret;
  59851 }
  59852 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s16(int16x4_t __p0) {
  59853   poly8x8_t __ret;
  59854   __ret = (poly8x8_t)(__p0);
  59855   return __ret;
  59856 }
  59857 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_p8(poly8x8_t __p0) {
  59858   poly64x1_t __ret;
  59859   __ret = (poly64x1_t)(__p0);
  59860   return __ret;
  59861 }
  59862 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_p16(poly16x4_t __p0) {
  59863   poly64x1_t __ret;
  59864   __ret = (poly64x1_t)(__p0);
  59865   return __ret;
  59866 }
  59867 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u8(uint8x8_t __p0) {
  59868   poly64x1_t __ret;
  59869   __ret = (poly64x1_t)(__p0);
  59870   return __ret;
  59871 }
  59872 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u32(uint32x2_t __p0) {
  59873   poly64x1_t __ret;
  59874   __ret = (poly64x1_t)(__p0);
  59875   return __ret;
  59876 }
  59877 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u64(uint64x1_t __p0) {
  59878   poly64x1_t __ret;
  59879   __ret = (poly64x1_t)(__p0);
  59880   return __ret;
  59881 }
  59882 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u16(uint16x4_t __p0) {
  59883   poly64x1_t __ret;
  59884   __ret = (poly64x1_t)(__p0);
  59885   return __ret;
  59886 }
  59887 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s8(int8x8_t __p0) {
  59888   poly64x1_t __ret;
  59889   __ret = (poly64x1_t)(__p0);
  59890   return __ret;
  59891 }
  59892 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f64(float64x1_t __p0) {
  59893   poly64x1_t __ret;
  59894   __ret = (poly64x1_t)(__p0);
  59895   return __ret;
  59896 }
  59897 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f32(float32x2_t __p0) {
  59898   poly64x1_t __ret;
  59899   __ret = (poly64x1_t)(__p0);
  59900   return __ret;
  59901 }
  59902 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f16(float16x4_t __p0) {
  59903   poly64x1_t __ret;
  59904   __ret = (poly64x1_t)(__p0);
  59905   return __ret;
  59906 }
  59907 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s32(int32x2_t __p0) {
  59908   poly64x1_t __ret;
  59909   __ret = (poly64x1_t)(__p0);
  59910   return __ret;
  59911 }
  59912 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s64(int64x1_t __p0) {
  59913   poly64x1_t __ret;
  59914   __ret = (poly64x1_t)(__p0);
  59915   return __ret;
  59916 }
  59917 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_mf8(mfloat8x8_t __p0) {
  59918   poly64x1_t __ret;
  59919   __ret = (poly64x1_t)(__p0);
  59920   return __ret;
  59921 }
  59922 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s16(int16x4_t __p0) {
  59923   poly64x1_t __ret;
  59924   __ret = (poly64x1_t)(__p0);
  59925   return __ret;
  59926 }
  59927 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p8(poly8x8_t __p0) {
  59928   poly16x4_t __ret;
  59929   __ret = (poly16x4_t)(__p0);
  59930   return __ret;
  59931 }
  59932 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p64(poly64x1_t __p0) {
  59933   poly16x4_t __ret;
  59934   __ret = (poly16x4_t)(__p0);
  59935   return __ret;
  59936 }
  59937 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u8(uint8x8_t __p0) {
  59938   poly16x4_t __ret;
  59939   __ret = (poly16x4_t)(__p0);
  59940   return __ret;
  59941 }
  59942 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u32(uint32x2_t __p0) {
  59943   poly16x4_t __ret;
  59944   __ret = (poly16x4_t)(__p0);
  59945   return __ret;
  59946 }
  59947 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u64(uint64x1_t __p0) {
  59948   poly16x4_t __ret;
  59949   __ret = (poly16x4_t)(__p0);
  59950   return __ret;
  59951 }
  59952 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u16(uint16x4_t __p0) {
  59953   poly16x4_t __ret;
  59954   __ret = (poly16x4_t)(__p0);
  59955   return __ret;
  59956 }
  59957 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s8(int8x8_t __p0) {
  59958   poly16x4_t __ret;
  59959   __ret = (poly16x4_t)(__p0);
  59960   return __ret;
  59961 }
  59962 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f64(float64x1_t __p0) {
  59963   poly16x4_t __ret;
  59964   __ret = (poly16x4_t)(__p0);
  59965   return __ret;
  59966 }
  59967 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f32(float32x2_t __p0) {
  59968   poly16x4_t __ret;
  59969   __ret = (poly16x4_t)(__p0);
  59970   return __ret;
  59971 }
  59972 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f16(float16x4_t __p0) {
  59973   poly16x4_t __ret;
  59974   __ret = (poly16x4_t)(__p0);
  59975   return __ret;
  59976 }
  59977 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s32(int32x2_t __p0) {
  59978   poly16x4_t __ret;
  59979   __ret = (poly16x4_t)(__p0);
  59980   return __ret;
  59981 }
  59982 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s64(int64x1_t __p0) {
  59983   poly16x4_t __ret;
  59984   __ret = (poly16x4_t)(__p0);
  59985   return __ret;
  59986 }
  59987 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_mf8(mfloat8x8_t __p0) {
  59988   poly16x4_t __ret;
  59989   __ret = (poly16x4_t)(__p0);
  59990   return __ret;
  59991 }
  59992 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s16(int16x4_t __p0) {
  59993   poly16x4_t __ret;
  59994   __ret = (poly16x4_t)(__p0);
  59995   return __ret;
  59996 }
  59997 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p128(poly128_t __p0) {
  59998   poly8x16_t __ret;
  59999   __ret = (poly8x16_t)(__p0);
  60000   return __ret;
  60001 }
  60002 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p64(poly64x2_t __p0) {
  60003   poly8x16_t __ret;
  60004   __ret = (poly8x16_t)(__p0);
  60005   return __ret;
  60006 }
  60007 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p16(poly16x8_t __p0) {
  60008   poly8x16_t __ret;
  60009   __ret = (poly8x16_t)(__p0);
  60010   return __ret;
  60011 }
  60012 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u8(uint8x16_t __p0) {
  60013   poly8x16_t __ret;
  60014   __ret = (poly8x16_t)(__p0);
  60015   return __ret;
  60016 }
  60017 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u32(uint32x4_t __p0) {
  60018   poly8x16_t __ret;
  60019   __ret = (poly8x16_t)(__p0);
  60020   return __ret;
  60021 }
  60022 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u64(uint64x2_t __p0) {
  60023   poly8x16_t __ret;
  60024   __ret = (poly8x16_t)(__p0);
  60025   return __ret;
  60026 }
  60027 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u16(uint16x8_t __p0) {
  60028   poly8x16_t __ret;
  60029   __ret = (poly8x16_t)(__p0);
  60030   return __ret;
  60031 }
  60032 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s8(int8x16_t __p0) {
  60033   poly8x16_t __ret;
  60034   __ret = (poly8x16_t)(__p0);
  60035   return __ret;
  60036 }
  60037 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f64(float64x2_t __p0) {
  60038   poly8x16_t __ret;
  60039   __ret = (poly8x16_t)(__p0);
  60040   return __ret;
  60041 }
  60042 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f32(float32x4_t __p0) {
  60043   poly8x16_t __ret;
  60044   __ret = (poly8x16_t)(__p0);
  60045   return __ret;
  60046 }
  60047 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f16(float16x8_t __p0) {
  60048   poly8x16_t __ret;
  60049   __ret = (poly8x16_t)(__p0);
  60050   return __ret;
  60051 }
  60052 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s32(int32x4_t __p0) {
  60053   poly8x16_t __ret;
  60054   __ret = (poly8x16_t)(__p0);
  60055   return __ret;
  60056 }
  60057 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s64(int64x2_t __p0) {
  60058   poly8x16_t __ret;
  60059   __ret = (poly8x16_t)(__p0);
  60060   return __ret;
  60061 }
  60062 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_mf8(mfloat8x16_t __p0) {
  60063   poly8x16_t __ret;
  60064   __ret = (poly8x16_t)(__p0);
  60065   return __ret;
  60066 }
  60067 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s16(int16x8_t __p0) {
  60068   poly8x16_t __ret;
  60069   __ret = (poly8x16_t)(__p0);
  60070   return __ret;
  60071 }
  60072 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_p8(poly8x16_t __p0) {
  60073   poly128_t __ret;
  60074   __ret = (poly128_t)(__p0);
  60075   return __ret;
  60076 }
  60077 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_p64(poly64x2_t __p0) {
  60078   poly128_t __ret;
  60079   __ret = (poly128_t)(__p0);
  60080   return __ret;
  60081 }
  60082 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_p16(poly16x8_t __p0) {
  60083   poly128_t __ret;
  60084   __ret = (poly128_t)(__p0);
  60085   return __ret;
  60086 }
  60087 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u8(uint8x16_t __p0) {
  60088   poly128_t __ret;
  60089   __ret = (poly128_t)(__p0);
  60090   return __ret;
  60091 }
  60092 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u32(uint32x4_t __p0) {
  60093   poly128_t __ret;
  60094   __ret = (poly128_t)(__p0);
  60095   return __ret;
  60096 }
  60097 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u64(uint64x2_t __p0) {
  60098   poly128_t __ret;
  60099   __ret = (poly128_t)(__p0);
  60100   return __ret;
  60101 }
  60102 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u16(uint16x8_t __p0) {
  60103   poly128_t __ret;
  60104   __ret = (poly128_t)(__p0);
  60105   return __ret;
  60106 }
  60107 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s8(int8x16_t __p0) {
  60108   poly128_t __ret;
  60109   __ret = (poly128_t)(__p0);
  60110   return __ret;
  60111 }
  60112 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f64(float64x2_t __p0) {
  60113   poly128_t __ret;
  60114   __ret = (poly128_t)(__p0);
  60115   return __ret;
  60116 }
  60117 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f32(float32x4_t __p0) {
  60118   poly128_t __ret;
  60119   __ret = (poly128_t)(__p0);
  60120   return __ret;
  60121 }
  60122 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f16(float16x8_t __p0) {
  60123   poly128_t __ret;
  60124   __ret = (poly128_t)(__p0);
  60125   return __ret;
  60126 }
  60127 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s32(int32x4_t __p0) {
  60128   poly128_t __ret;
  60129   __ret = (poly128_t)(__p0);
  60130   return __ret;
  60131 }
  60132 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s64(int64x2_t __p0) {
  60133   poly128_t __ret;
  60134   __ret = (poly128_t)(__p0);
  60135   return __ret;
  60136 }
  60137 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_mf8(mfloat8x16_t __p0) {
  60138   poly128_t __ret;
  60139   __ret = (poly128_t)(__p0);
  60140   return __ret;
  60141 }
  60142 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s16(int16x8_t __p0) {
  60143   poly128_t __ret;
  60144   __ret = (poly128_t)(__p0);
  60145   return __ret;
  60146 }
  60147 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p8(poly8x16_t __p0) {
  60148   poly64x2_t __ret;
  60149   __ret = (poly64x2_t)(__p0);
  60150   return __ret;
  60151 }
  60152 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p128(poly128_t __p0) {
  60153   poly64x2_t __ret;
  60154   __ret = (poly64x2_t)(__p0);
  60155   return __ret;
  60156 }
  60157 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p16(poly16x8_t __p0) {
  60158   poly64x2_t __ret;
  60159   __ret = (poly64x2_t)(__p0);
  60160   return __ret;
  60161 }
  60162 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u8(uint8x16_t __p0) {
  60163   poly64x2_t __ret;
  60164   __ret = (poly64x2_t)(__p0);
  60165   return __ret;
  60166 }
  60167 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u32(uint32x4_t __p0) {
  60168   poly64x2_t __ret;
  60169   __ret = (poly64x2_t)(__p0);
  60170   return __ret;
  60171 }
  60172 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u64(uint64x2_t __p0) {
  60173   poly64x2_t __ret;
  60174   __ret = (poly64x2_t)(__p0);
  60175   return __ret;
  60176 }
  60177 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u16(uint16x8_t __p0) {
  60178   poly64x2_t __ret;
  60179   __ret = (poly64x2_t)(__p0);
  60180   return __ret;
  60181 }
  60182 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s8(int8x16_t __p0) {
  60183   poly64x2_t __ret;
  60184   __ret = (poly64x2_t)(__p0);
  60185   return __ret;
  60186 }
  60187 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_f64(float64x2_t __p0) {
  60188   poly64x2_t __ret;
  60189   __ret = (poly64x2_t)(__p0);
  60190   return __ret;
  60191 }
  60192 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_f32(float32x4_t __p0) {
  60193   poly64x2_t __ret;
  60194   __ret = (poly64x2_t)(__p0);
  60195   return __ret;
  60196 }
  60197 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_f16(float16x8_t __p0) {
  60198   poly64x2_t __ret;
  60199   __ret = (poly64x2_t)(__p0);
  60200   return __ret;
  60201 }
  60202 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s32(int32x4_t __p0) {
  60203   poly64x2_t __ret;
  60204   __ret = (poly64x2_t)(__p0);
  60205   return __ret;
  60206 }
  60207 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s64(int64x2_t __p0) {
  60208   poly64x2_t __ret;
  60209   __ret = (poly64x2_t)(__p0);
  60210   return __ret;
  60211 }
  60212 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_mf8(mfloat8x16_t __p0) {
  60213   poly64x2_t __ret;
  60214   __ret = (poly64x2_t)(__p0);
  60215   return __ret;
  60216 }
  60217 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s16(int16x8_t __p0) {
  60218   poly64x2_t __ret;
  60219   __ret = (poly64x2_t)(__p0);
  60220   return __ret;
  60221 }
  60222 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p8(poly8x16_t __p0) {
  60223   poly16x8_t __ret;
  60224   __ret = (poly16x8_t)(__p0);
  60225   return __ret;
  60226 }
  60227 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p128(poly128_t __p0) {
  60228   poly16x8_t __ret;
  60229   __ret = (poly16x8_t)(__p0);
  60230   return __ret;
  60231 }
  60232 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p64(poly64x2_t __p0) {
  60233   poly16x8_t __ret;
  60234   __ret = (poly16x8_t)(__p0);
  60235   return __ret;
  60236 }
  60237 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u8(uint8x16_t __p0) {
  60238   poly16x8_t __ret;
  60239   __ret = (poly16x8_t)(__p0);
  60240   return __ret;
  60241 }
  60242 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u32(uint32x4_t __p0) {
  60243   poly16x8_t __ret;
  60244   __ret = (poly16x8_t)(__p0);
  60245   return __ret;
  60246 }
  60247 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u64(uint64x2_t __p0) {
  60248   poly16x8_t __ret;
  60249   __ret = (poly16x8_t)(__p0);
  60250   return __ret;
  60251 }
  60252 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u16(uint16x8_t __p0) {
  60253   poly16x8_t __ret;
  60254   __ret = (poly16x8_t)(__p0);
  60255   return __ret;
  60256 }
  60257 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s8(int8x16_t __p0) {
  60258   poly16x8_t __ret;
  60259   __ret = (poly16x8_t)(__p0);
  60260   return __ret;
  60261 }
  60262 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f64(float64x2_t __p0) {
  60263   poly16x8_t __ret;
  60264   __ret = (poly16x8_t)(__p0);
  60265   return __ret;
  60266 }
  60267 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f32(float32x4_t __p0) {
  60268   poly16x8_t __ret;
  60269   __ret = (poly16x8_t)(__p0);
  60270   return __ret;
  60271 }
  60272 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f16(float16x8_t __p0) {
  60273   poly16x8_t __ret;
  60274   __ret = (poly16x8_t)(__p0);
  60275   return __ret;
  60276 }
  60277 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s32(int32x4_t __p0) {
  60278   poly16x8_t __ret;
  60279   __ret = (poly16x8_t)(__p0);
  60280   return __ret;
  60281 }
  60282 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s64(int64x2_t __p0) {
  60283   poly16x8_t __ret;
  60284   __ret = (poly16x8_t)(__p0);
  60285   return __ret;
  60286 }
  60287 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_mf8(mfloat8x16_t __p0) {
  60288   poly16x8_t __ret;
  60289   __ret = (poly16x8_t)(__p0);
  60290   return __ret;
  60291 }
  60292 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s16(int16x8_t __p0) {
  60293   poly16x8_t __ret;
  60294   __ret = (poly16x8_t)(__p0);
  60295   return __ret;
  60296 }
  60297 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p8(poly8x16_t __p0) {
  60298   uint8x16_t __ret;
  60299   __ret = (uint8x16_t)(__p0);
  60300   return __ret;
  60301 }
  60302 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p128(poly128_t __p0) {
  60303   uint8x16_t __ret;
  60304   __ret = (uint8x16_t)(__p0);
  60305   return __ret;
  60306 }
  60307 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p64(poly64x2_t __p0) {
  60308   uint8x16_t __ret;
  60309   __ret = (uint8x16_t)(__p0);
  60310   return __ret;
  60311 }
  60312 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p16(poly16x8_t __p0) {
  60313   uint8x16_t __ret;
  60314   __ret = (uint8x16_t)(__p0);
  60315   return __ret;
  60316 }
  60317 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u32(uint32x4_t __p0) {
  60318   uint8x16_t __ret;
  60319   __ret = (uint8x16_t)(__p0);
  60320   return __ret;
  60321 }
  60322 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u64(uint64x2_t __p0) {
  60323   uint8x16_t __ret;
  60324   __ret = (uint8x16_t)(__p0);
  60325   return __ret;
  60326 }
  60327 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u16(uint16x8_t __p0) {
  60328   uint8x16_t __ret;
  60329   __ret = (uint8x16_t)(__p0);
  60330   return __ret;
  60331 }
  60332 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s8(int8x16_t __p0) {
  60333   uint8x16_t __ret;
  60334   __ret = (uint8x16_t)(__p0);
  60335   return __ret;
  60336 }
  60337 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f64(float64x2_t __p0) {
  60338   uint8x16_t __ret;
  60339   __ret = (uint8x16_t)(__p0);
  60340   return __ret;
  60341 }
  60342 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f32(float32x4_t __p0) {
  60343   uint8x16_t __ret;
  60344   __ret = (uint8x16_t)(__p0);
  60345   return __ret;
  60346 }
  60347 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f16(float16x8_t __p0) {
  60348   uint8x16_t __ret;
  60349   __ret = (uint8x16_t)(__p0);
  60350   return __ret;
  60351 }
  60352 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s32(int32x4_t __p0) {
  60353   uint8x16_t __ret;
  60354   __ret = (uint8x16_t)(__p0);
  60355   return __ret;
  60356 }
  60357 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s64(int64x2_t __p0) {
  60358   uint8x16_t __ret;
  60359   __ret = (uint8x16_t)(__p0);
  60360   return __ret;
  60361 }
  60362 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_mf8(mfloat8x16_t __p0) {
  60363   uint8x16_t __ret;
  60364   __ret = (uint8x16_t)(__p0);
  60365   return __ret;
  60366 }
  60367 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s16(int16x8_t __p0) {
  60368   uint8x16_t __ret;
  60369   __ret = (uint8x16_t)(__p0);
  60370   return __ret;
  60371 }
  60372 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p8(poly8x16_t __p0) {
  60373   uint32x4_t __ret;
  60374   __ret = (uint32x4_t)(__p0);
  60375   return __ret;
  60376 }
  60377 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p128(poly128_t __p0) {
  60378   uint32x4_t __ret;
  60379   __ret = (uint32x4_t)(__p0);
  60380   return __ret;
  60381 }
  60382 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p64(poly64x2_t __p0) {
  60383   uint32x4_t __ret;
  60384   __ret = (uint32x4_t)(__p0);
  60385   return __ret;
  60386 }
  60387 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p16(poly16x8_t __p0) {
  60388   uint32x4_t __ret;
  60389   __ret = (uint32x4_t)(__p0);
  60390   return __ret;
  60391 }
  60392 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u8(uint8x16_t __p0) {
  60393   uint32x4_t __ret;
  60394   __ret = (uint32x4_t)(__p0);
  60395   return __ret;
  60396 }
  60397 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u64(uint64x2_t __p0) {
  60398   uint32x4_t __ret;
  60399   __ret = (uint32x4_t)(__p0);
  60400   return __ret;
  60401 }
  60402 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u16(uint16x8_t __p0) {
  60403   uint32x4_t __ret;
  60404   __ret = (uint32x4_t)(__p0);
  60405   return __ret;
  60406 }
  60407 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s8(int8x16_t __p0) {
  60408   uint32x4_t __ret;
  60409   __ret = (uint32x4_t)(__p0);
  60410   return __ret;
  60411 }
  60412 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f64(float64x2_t __p0) {
  60413   uint32x4_t __ret;
  60414   __ret = (uint32x4_t)(__p0);
  60415   return __ret;
  60416 }
  60417 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f32(float32x4_t __p0) {
  60418   uint32x4_t __ret;
  60419   __ret = (uint32x4_t)(__p0);
  60420   return __ret;
  60421 }
  60422 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f16(float16x8_t __p0) {
  60423   uint32x4_t __ret;
  60424   __ret = (uint32x4_t)(__p0);
  60425   return __ret;
  60426 }
  60427 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s32(int32x4_t __p0) {
  60428   uint32x4_t __ret;
  60429   __ret = (uint32x4_t)(__p0);
  60430   return __ret;
  60431 }
  60432 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s64(int64x2_t __p0) {
  60433   uint32x4_t __ret;
  60434   __ret = (uint32x4_t)(__p0);
  60435   return __ret;
  60436 }
  60437 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_mf8(mfloat8x16_t __p0) {
  60438   uint32x4_t __ret;
  60439   __ret = (uint32x4_t)(__p0);
  60440   return __ret;
  60441 }
  60442 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s16(int16x8_t __p0) {
  60443   uint32x4_t __ret;
  60444   __ret = (uint32x4_t)(__p0);
  60445   return __ret;
  60446 }
  60447 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p8(poly8x16_t __p0) {
  60448   uint64x2_t __ret;
  60449   __ret = (uint64x2_t)(__p0);
  60450   return __ret;
  60451 }
  60452 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p128(poly128_t __p0) {
  60453   uint64x2_t __ret;
  60454   __ret = (uint64x2_t)(__p0);
  60455   return __ret;
  60456 }
  60457 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p64(poly64x2_t __p0) {
  60458   uint64x2_t __ret;
  60459   __ret = (uint64x2_t)(__p0);
  60460   return __ret;
  60461 }
  60462 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p16(poly16x8_t __p0) {
  60463   uint64x2_t __ret;
  60464   __ret = (uint64x2_t)(__p0);
  60465   return __ret;
  60466 }
  60467 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u8(uint8x16_t __p0) {
  60468   uint64x2_t __ret;
  60469   __ret = (uint64x2_t)(__p0);
  60470   return __ret;
  60471 }
  60472 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u32(uint32x4_t __p0) {
  60473   uint64x2_t __ret;
  60474   __ret = (uint64x2_t)(__p0);
  60475   return __ret;
  60476 }
  60477 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u16(uint16x8_t __p0) {
  60478   uint64x2_t __ret;
  60479   __ret = (uint64x2_t)(__p0);
  60480   return __ret;
  60481 }
  60482 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s8(int8x16_t __p0) {
  60483   uint64x2_t __ret;
  60484   __ret = (uint64x2_t)(__p0);
  60485   return __ret;
  60486 }
  60487 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f64(float64x2_t __p0) {
  60488   uint64x2_t __ret;
  60489   __ret = (uint64x2_t)(__p0);
  60490   return __ret;
  60491 }
  60492 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f32(float32x4_t __p0) {
  60493   uint64x2_t __ret;
  60494   __ret = (uint64x2_t)(__p0);
  60495   return __ret;
  60496 }
  60497 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f16(float16x8_t __p0) {
  60498   uint64x2_t __ret;
  60499   __ret = (uint64x2_t)(__p0);
  60500   return __ret;
  60501 }
  60502 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s32(int32x4_t __p0) {
  60503   uint64x2_t __ret;
  60504   __ret = (uint64x2_t)(__p0);
  60505   return __ret;
  60506 }
  60507 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s64(int64x2_t __p0) {
  60508   uint64x2_t __ret;
  60509   __ret = (uint64x2_t)(__p0);
  60510   return __ret;
  60511 }
  60512 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_mf8(mfloat8x16_t __p0) {
  60513   uint64x2_t __ret;
  60514   __ret = (uint64x2_t)(__p0);
  60515   return __ret;
  60516 }
  60517 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s16(int16x8_t __p0) {
  60518   uint64x2_t __ret;
  60519   __ret = (uint64x2_t)(__p0);
  60520   return __ret;
  60521 }
  60522 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p8(poly8x16_t __p0) {
  60523   uint16x8_t __ret;
  60524   __ret = (uint16x8_t)(__p0);
  60525   return __ret;
  60526 }
  60527 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p128(poly128_t __p0) {
  60528   uint16x8_t __ret;
  60529   __ret = (uint16x8_t)(__p0);
  60530   return __ret;
  60531 }
  60532 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p64(poly64x2_t __p0) {
  60533   uint16x8_t __ret;
  60534   __ret = (uint16x8_t)(__p0);
  60535   return __ret;
  60536 }
  60537 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p16(poly16x8_t __p0) {
  60538   uint16x8_t __ret;
  60539   __ret = (uint16x8_t)(__p0);
  60540   return __ret;
  60541 }
  60542 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u8(uint8x16_t __p0) {
  60543   uint16x8_t __ret;
  60544   __ret = (uint16x8_t)(__p0);
  60545   return __ret;
  60546 }
  60547 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u32(uint32x4_t __p0) {
  60548   uint16x8_t __ret;
  60549   __ret = (uint16x8_t)(__p0);
  60550   return __ret;
  60551 }
  60552 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u64(uint64x2_t __p0) {
  60553   uint16x8_t __ret;
  60554   __ret = (uint16x8_t)(__p0);
  60555   return __ret;
  60556 }
  60557 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s8(int8x16_t __p0) {
  60558   uint16x8_t __ret;
  60559   __ret = (uint16x8_t)(__p0);
  60560   return __ret;
  60561 }
  60562 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f64(float64x2_t __p0) {
  60563   uint16x8_t __ret;
  60564   __ret = (uint16x8_t)(__p0);
  60565   return __ret;
  60566 }
  60567 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f32(float32x4_t __p0) {
  60568   uint16x8_t __ret;
  60569   __ret = (uint16x8_t)(__p0);
  60570   return __ret;
  60571 }
  60572 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f16(float16x8_t __p0) {
  60573   uint16x8_t __ret;
  60574   __ret = (uint16x8_t)(__p0);
  60575   return __ret;
  60576 }
  60577 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s32(int32x4_t __p0) {
  60578   uint16x8_t __ret;
  60579   __ret = (uint16x8_t)(__p0);
  60580   return __ret;
  60581 }
  60582 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s64(int64x2_t __p0) {
  60583   uint16x8_t __ret;
  60584   __ret = (uint16x8_t)(__p0);
  60585   return __ret;
  60586 }
  60587 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_mf8(mfloat8x16_t __p0) {
  60588   uint16x8_t __ret;
  60589   __ret = (uint16x8_t)(__p0);
  60590   return __ret;
  60591 }
  60592 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s16(int16x8_t __p0) {
  60593   uint16x8_t __ret;
  60594   __ret = (uint16x8_t)(__p0);
  60595   return __ret;
  60596 }
  60597 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p8(poly8x16_t __p0) {
  60598   int8x16_t __ret;
  60599   __ret = (int8x16_t)(__p0);
  60600   return __ret;
  60601 }
  60602 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p128(poly128_t __p0) {
  60603   int8x16_t __ret;
  60604   __ret = (int8x16_t)(__p0);
  60605   return __ret;
  60606 }
  60607 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p64(poly64x2_t __p0) {
  60608   int8x16_t __ret;
  60609   __ret = (int8x16_t)(__p0);
  60610   return __ret;
  60611 }
  60612 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p16(poly16x8_t __p0) {
  60613   int8x16_t __ret;
  60614   __ret = (int8x16_t)(__p0);
  60615   return __ret;
  60616 }
  60617 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u8(uint8x16_t __p0) {
  60618   int8x16_t __ret;
  60619   __ret = (int8x16_t)(__p0);
  60620   return __ret;
  60621 }
  60622 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u32(uint32x4_t __p0) {
  60623   int8x16_t __ret;
  60624   __ret = (int8x16_t)(__p0);
  60625   return __ret;
  60626 }
  60627 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u64(uint64x2_t __p0) {
  60628   int8x16_t __ret;
  60629   __ret = (int8x16_t)(__p0);
  60630   return __ret;
  60631 }
  60632 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u16(uint16x8_t __p0) {
  60633   int8x16_t __ret;
  60634   __ret = (int8x16_t)(__p0);
  60635   return __ret;
  60636 }
  60637 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f64(float64x2_t __p0) {
  60638   int8x16_t __ret;
  60639   __ret = (int8x16_t)(__p0);
  60640   return __ret;
  60641 }
  60642 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f32(float32x4_t __p0) {
  60643   int8x16_t __ret;
  60644   __ret = (int8x16_t)(__p0);
  60645   return __ret;
  60646 }
  60647 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f16(float16x8_t __p0) {
  60648   int8x16_t __ret;
  60649   __ret = (int8x16_t)(__p0);
  60650   return __ret;
  60651 }
  60652 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s32(int32x4_t __p0) {
  60653   int8x16_t __ret;
  60654   __ret = (int8x16_t)(__p0);
  60655   return __ret;
  60656 }
  60657 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s64(int64x2_t __p0) {
  60658   int8x16_t __ret;
  60659   __ret = (int8x16_t)(__p0);
  60660   return __ret;
  60661 }
  60662 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_mf8(mfloat8x16_t __p0) {
  60663   int8x16_t __ret;
  60664   __ret = (int8x16_t)(__p0);
  60665   return __ret;
  60666 }
  60667 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s16(int16x8_t __p0) {
  60668   int8x16_t __ret;
  60669   __ret = (int8x16_t)(__p0);
  60670   return __ret;
  60671 }
  60672 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p8(poly8x16_t __p0) {
  60673   float64x2_t __ret;
  60674   __ret = (float64x2_t)(__p0);
  60675   return __ret;
  60676 }
  60677 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p128(poly128_t __p0) {
  60678   float64x2_t __ret;
  60679   __ret = (float64x2_t)(__p0);
  60680   return __ret;
  60681 }
  60682 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p64(poly64x2_t __p0) {
  60683   float64x2_t __ret;
  60684   __ret = (float64x2_t)(__p0);
  60685   return __ret;
  60686 }
  60687 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p16(poly16x8_t __p0) {
  60688   float64x2_t __ret;
  60689   __ret = (float64x2_t)(__p0);
  60690   return __ret;
  60691 }
  60692 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u8(uint8x16_t __p0) {
  60693   float64x2_t __ret;
  60694   __ret = (float64x2_t)(__p0);
  60695   return __ret;
  60696 }
  60697 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u32(uint32x4_t __p0) {
  60698   float64x2_t __ret;
  60699   __ret = (float64x2_t)(__p0);
  60700   return __ret;
  60701 }
  60702 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u64(uint64x2_t __p0) {
  60703   float64x2_t __ret;
  60704   __ret = (float64x2_t)(__p0);
  60705   return __ret;
  60706 }
  60707 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u16(uint16x8_t __p0) {
  60708   float64x2_t __ret;
  60709   __ret = (float64x2_t)(__p0);
  60710   return __ret;
  60711 }
  60712 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s8(int8x16_t __p0) {
  60713   float64x2_t __ret;
  60714   __ret = (float64x2_t)(__p0);
  60715   return __ret;
  60716 }
  60717 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_f32(float32x4_t __p0) {
  60718   float64x2_t __ret;
  60719   __ret = (float64x2_t)(__p0);
  60720   return __ret;
  60721 }
  60722 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_f16(float16x8_t __p0) {
  60723   float64x2_t __ret;
  60724   __ret = (float64x2_t)(__p0);
  60725   return __ret;
  60726 }
  60727 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s32(int32x4_t __p0) {
  60728   float64x2_t __ret;
  60729   __ret = (float64x2_t)(__p0);
  60730   return __ret;
  60731 }
  60732 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s64(int64x2_t __p0) {
  60733   float64x2_t __ret;
  60734   __ret = (float64x2_t)(__p0);
  60735   return __ret;
  60736 }
  60737 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_mf8(mfloat8x16_t __p0) {
  60738   float64x2_t __ret;
  60739   __ret = (float64x2_t)(__p0);
  60740   return __ret;
  60741 }
  60742 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s16(int16x8_t __p0) {
  60743   float64x2_t __ret;
  60744   __ret = (float64x2_t)(__p0);
  60745   return __ret;
  60746 }
  60747 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p8(poly8x16_t __p0) {
  60748   float32x4_t __ret;
  60749   __ret = (float32x4_t)(__p0);
  60750   return __ret;
  60751 }
  60752 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p128(poly128_t __p0) {
  60753   float32x4_t __ret;
  60754   __ret = (float32x4_t)(__p0);
  60755   return __ret;
  60756 }
  60757 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p64(poly64x2_t __p0) {
  60758   float32x4_t __ret;
  60759   __ret = (float32x4_t)(__p0);
  60760   return __ret;
  60761 }
  60762 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p16(poly16x8_t __p0) {
  60763   float32x4_t __ret;
  60764   __ret = (float32x4_t)(__p0);
  60765   return __ret;
  60766 }
  60767 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u8(uint8x16_t __p0) {
  60768   float32x4_t __ret;
  60769   __ret = (float32x4_t)(__p0);
  60770   return __ret;
  60771 }
  60772 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u32(uint32x4_t __p0) {
  60773   float32x4_t __ret;
  60774   __ret = (float32x4_t)(__p0);
  60775   return __ret;
  60776 }
  60777 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u64(uint64x2_t __p0) {
  60778   float32x4_t __ret;
  60779   __ret = (float32x4_t)(__p0);
  60780   return __ret;
  60781 }
  60782 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u16(uint16x8_t __p0) {
  60783   float32x4_t __ret;
  60784   __ret = (float32x4_t)(__p0);
  60785   return __ret;
  60786 }
  60787 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s8(int8x16_t __p0) {
  60788   float32x4_t __ret;
  60789   __ret = (float32x4_t)(__p0);
  60790   return __ret;
  60791 }
  60792 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_f64(float64x2_t __p0) {
  60793   float32x4_t __ret;
  60794   __ret = (float32x4_t)(__p0);
  60795   return __ret;
  60796 }
  60797 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_f16(float16x8_t __p0) {
  60798   float32x4_t __ret;
  60799   __ret = (float32x4_t)(__p0);
  60800   return __ret;
  60801 }
  60802 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s32(int32x4_t __p0) {
  60803   float32x4_t __ret;
  60804   __ret = (float32x4_t)(__p0);
  60805   return __ret;
  60806 }
  60807 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s64(int64x2_t __p0) {
  60808   float32x4_t __ret;
  60809   __ret = (float32x4_t)(__p0);
  60810   return __ret;
  60811 }
  60812 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_mf8(mfloat8x16_t __p0) {
  60813   float32x4_t __ret;
  60814   __ret = (float32x4_t)(__p0);
  60815   return __ret;
  60816 }
  60817 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s16(int16x8_t __p0) {
  60818   float32x4_t __ret;
  60819   __ret = (float32x4_t)(__p0);
  60820   return __ret;
  60821 }
  60822 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p8(poly8x16_t __p0) {
  60823   float16x8_t __ret;
  60824   __ret = (float16x8_t)(__p0);
  60825   return __ret;
  60826 }
  60827 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p128(poly128_t __p0) {
  60828   float16x8_t __ret;
  60829   __ret = (float16x8_t)(__p0);
  60830   return __ret;
  60831 }
  60832 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p64(poly64x2_t __p0) {
  60833   float16x8_t __ret;
  60834   __ret = (float16x8_t)(__p0);
  60835   return __ret;
  60836 }
  60837 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p16(poly16x8_t __p0) {
  60838   float16x8_t __ret;
  60839   __ret = (float16x8_t)(__p0);
  60840   return __ret;
  60841 }
  60842 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u8(uint8x16_t __p0) {
  60843   float16x8_t __ret;
  60844   __ret = (float16x8_t)(__p0);
  60845   return __ret;
  60846 }
  60847 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u32(uint32x4_t __p0) {
  60848   float16x8_t __ret;
  60849   __ret = (float16x8_t)(__p0);
  60850   return __ret;
  60851 }
  60852 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u64(uint64x2_t __p0) {
  60853   float16x8_t __ret;
  60854   __ret = (float16x8_t)(__p0);
  60855   return __ret;
  60856 }
  60857 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u16(uint16x8_t __p0) {
  60858   float16x8_t __ret;
  60859   __ret = (float16x8_t)(__p0);
  60860   return __ret;
  60861 }
  60862 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s8(int8x16_t __p0) {
  60863   float16x8_t __ret;
  60864   __ret = (float16x8_t)(__p0);
  60865   return __ret;
  60866 }
  60867 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f64(float64x2_t __p0) {
  60868   float16x8_t __ret;
  60869   __ret = (float16x8_t)(__p0);
  60870   return __ret;
  60871 }
  60872 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f32(float32x4_t __p0) {
  60873   float16x8_t __ret;
  60874   __ret = (float16x8_t)(__p0);
  60875   return __ret;
  60876 }
  60877 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s32(int32x4_t __p0) {
  60878   float16x8_t __ret;
  60879   __ret = (float16x8_t)(__p0);
  60880   return __ret;
  60881 }
  60882 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s64(int64x2_t __p0) {
  60883   float16x8_t __ret;
  60884   __ret = (float16x8_t)(__p0);
  60885   return __ret;
  60886 }
  60887 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_mf8(mfloat8x16_t __p0) {
  60888   float16x8_t __ret;
  60889   __ret = (float16x8_t)(__p0);
  60890   return __ret;
  60891 }
  60892 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s16(int16x8_t __p0) {
  60893   float16x8_t __ret;
  60894   __ret = (float16x8_t)(__p0);
  60895   return __ret;
  60896 }
  60897 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p8(poly8x16_t __p0) {
  60898   int32x4_t __ret;
  60899   __ret = (int32x4_t)(__p0);
  60900   return __ret;
  60901 }
  60902 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p128(poly128_t __p0) {
  60903   int32x4_t __ret;
  60904   __ret = (int32x4_t)(__p0);
  60905   return __ret;
  60906 }
  60907 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p64(poly64x2_t __p0) {
  60908   int32x4_t __ret;
  60909   __ret = (int32x4_t)(__p0);
  60910   return __ret;
  60911 }
  60912 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p16(poly16x8_t __p0) {
  60913   int32x4_t __ret;
  60914   __ret = (int32x4_t)(__p0);
  60915   return __ret;
  60916 }
  60917 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u8(uint8x16_t __p0) {
  60918   int32x4_t __ret;
  60919   __ret = (int32x4_t)(__p0);
  60920   return __ret;
  60921 }
  60922 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u32(uint32x4_t __p0) {
  60923   int32x4_t __ret;
  60924   __ret = (int32x4_t)(__p0);
  60925   return __ret;
  60926 }
  60927 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u64(uint64x2_t __p0) {
  60928   int32x4_t __ret;
  60929   __ret = (int32x4_t)(__p0);
  60930   return __ret;
  60931 }
  60932 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u16(uint16x8_t __p0) {
  60933   int32x4_t __ret;
  60934   __ret = (int32x4_t)(__p0);
  60935   return __ret;
  60936 }
  60937 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s8(int8x16_t __p0) {
  60938   int32x4_t __ret;
  60939   __ret = (int32x4_t)(__p0);
  60940   return __ret;
  60941 }
  60942 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f64(float64x2_t __p0) {
  60943   int32x4_t __ret;
  60944   __ret = (int32x4_t)(__p0);
  60945   return __ret;
  60946 }
  60947 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f32(float32x4_t __p0) {
  60948   int32x4_t __ret;
  60949   __ret = (int32x4_t)(__p0);
  60950   return __ret;
  60951 }
  60952 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f16(float16x8_t __p0) {
  60953   int32x4_t __ret;
  60954   __ret = (int32x4_t)(__p0);
  60955   return __ret;
  60956 }
  60957 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s64(int64x2_t __p0) {
  60958   int32x4_t __ret;
  60959   __ret = (int32x4_t)(__p0);
  60960   return __ret;
  60961 }
  60962 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_mf8(mfloat8x16_t __p0) {
  60963   int32x4_t __ret;
  60964   __ret = (int32x4_t)(__p0);
  60965   return __ret;
  60966 }
  60967 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s16(int16x8_t __p0) {
  60968   int32x4_t __ret;
  60969   __ret = (int32x4_t)(__p0);
  60970   return __ret;
  60971 }
  60972 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p8(poly8x16_t __p0) {
  60973   int64x2_t __ret;
  60974   __ret = (int64x2_t)(__p0);
  60975   return __ret;
  60976 }
  60977 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p128(poly128_t __p0) {
  60978   int64x2_t __ret;
  60979   __ret = (int64x2_t)(__p0);
  60980   return __ret;
  60981 }
  60982 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p64(poly64x2_t __p0) {
  60983   int64x2_t __ret;
  60984   __ret = (int64x2_t)(__p0);
  60985   return __ret;
  60986 }
  60987 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p16(poly16x8_t __p0) {
  60988   int64x2_t __ret;
  60989   __ret = (int64x2_t)(__p0);
  60990   return __ret;
  60991 }
  60992 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u8(uint8x16_t __p0) {
  60993   int64x2_t __ret;
  60994   __ret = (int64x2_t)(__p0);
  60995   return __ret;
  60996 }
  60997 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u32(uint32x4_t __p0) {
  60998   int64x2_t __ret;
  60999   __ret = (int64x2_t)(__p0);
  61000   return __ret;
  61001 }
  61002 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u64(uint64x2_t __p0) {
  61003   int64x2_t __ret;
  61004   __ret = (int64x2_t)(__p0);
  61005   return __ret;
  61006 }
  61007 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u16(uint16x8_t __p0) {
  61008   int64x2_t __ret;
  61009   __ret = (int64x2_t)(__p0);
  61010   return __ret;
  61011 }
  61012 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s8(int8x16_t __p0) {
  61013   int64x2_t __ret;
  61014   __ret = (int64x2_t)(__p0);
  61015   return __ret;
  61016 }
  61017 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f64(float64x2_t __p0) {
  61018   int64x2_t __ret;
  61019   __ret = (int64x2_t)(__p0);
  61020   return __ret;
  61021 }
  61022 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f32(float32x4_t __p0) {
  61023   int64x2_t __ret;
  61024   __ret = (int64x2_t)(__p0);
  61025   return __ret;
  61026 }
  61027 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f16(float16x8_t __p0) {
  61028   int64x2_t __ret;
  61029   __ret = (int64x2_t)(__p0);
  61030   return __ret;
  61031 }
  61032 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s32(int32x4_t __p0) {
  61033   int64x2_t __ret;
  61034   __ret = (int64x2_t)(__p0);
  61035   return __ret;
  61036 }
  61037 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_mf8(mfloat8x16_t __p0) {
  61038   int64x2_t __ret;
  61039   __ret = (int64x2_t)(__p0);
  61040   return __ret;
  61041 }
  61042 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s16(int16x8_t __p0) {
  61043   int64x2_t __ret;
  61044   __ret = (int64x2_t)(__p0);
  61045   return __ret;
  61046 }
  61047 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p8(poly8x16_t __p0) {
  61048   mfloat8x16_t __ret;
  61049   __ret = (mfloat8x16_t)(__p0);
  61050   return __ret;
  61051 }
  61052 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p128(poly128_t __p0) {
  61053   mfloat8x16_t __ret;
  61054   __ret = (mfloat8x16_t)(__p0);
  61055   return __ret;
  61056 }
  61057 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p64(poly64x2_t __p0) {
  61058   mfloat8x16_t __ret;
  61059   __ret = (mfloat8x16_t)(__p0);
  61060   return __ret;
  61061 }
  61062 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p16(poly16x8_t __p0) {
  61063   mfloat8x16_t __ret;
  61064   __ret = (mfloat8x16_t)(__p0);
  61065   return __ret;
  61066 }
  61067 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u8(uint8x16_t __p0) {
  61068   mfloat8x16_t __ret;
  61069   __ret = (mfloat8x16_t)(__p0);
  61070   return __ret;
  61071 }
  61072 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u32(uint32x4_t __p0) {
  61073   mfloat8x16_t __ret;
  61074   __ret = (mfloat8x16_t)(__p0);
  61075   return __ret;
  61076 }
  61077 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u64(uint64x2_t __p0) {
  61078   mfloat8x16_t __ret;
  61079   __ret = (mfloat8x16_t)(__p0);
  61080   return __ret;
  61081 }
  61082 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u16(uint16x8_t __p0) {
  61083   mfloat8x16_t __ret;
  61084   __ret = (mfloat8x16_t)(__p0);
  61085   return __ret;
  61086 }
  61087 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s8(int8x16_t __p0) {
  61088   mfloat8x16_t __ret;
  61089   __ret = (mfloat8x16_t)(__p0);
  61090   return __ret;
  61091 }
  61092 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f64(float64x2_t __p0) {
  61093   mfloat8x16_t __ret;
  61094   __ret = (mfloat8x16_t)(__p0);
  61095   return __ret;
  61096 }
  61097 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f32(float32x4_t __p0) {
  61098   mfloat8x16_t __ret;
  61099   __ret = (mfloat8x16_t)(__p0);
  61100   return __ret;
  61101 }
  61102 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f16(float16x8_t __p0) {
  61103   mfloat8x16_t __ret;
  61104   __ret = (mfloat8x16_t)(__p0);
  61105   return __ret;
  61106 }
  61107 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s32(int32x4_t __p0) {
  61108   mfloat8x16_t __ret;
  61109   __ret = (mfloat8x16_t)(__p0);
  61110   return __ret;
  61111 }
  61112 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s64(int64x2_t __p0) {
  61113   mfloat8x16_t __ret;
  61114   __ret = (mfloat8x16_t)(__p0);
  61115   return __ret;
  61116 }
  61117 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s16(int16x8_t __p0) {
  61118   mfloat8x16_t __ret;
  61119   __ret = (mfloat8x16_t)(__p0);
  61120   return __ret;
  61121 }
  61122 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p8(poly8x16_t __p0) {
  61123   int16x8_t __ret;
  61124   __ret = (int16x8_t)(__p0);
  61125   return __ret;
  61126 }
  61127 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p128(poly128_t __p0) {
  61128   int16x8_t __ret;
  61129   __ret = (int16x8_t)(__p0);
  61130   return __ret;
  61131 }
  61132 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p64(poly64x2_t __p0) {
  61133   int16x8_t __ret;
  61134   __ret = (int16x8_t)(__p0);
  61135   return __ret;
  61136 }
  61137 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p16(poly16x8_t __p0) {
  61138   int16x8_t __ret;
  61139   __ret = (int16x8_t)(__p0);
  61140   return __ret;
  61141 }
  61142 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u8(uint8x16_t __p0) {
  61143   int16x8_t __ret;
  61144   __ret = (int16x8_t)(__p0);
  61145   return __ret;
  61146 }
  61147 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u32(uint32x4_t __p0) {
  61148   int16x8_t __ret;
  61149   __ret = (int16x8_t)(__p0);
  61150   return __ret;
  61151 }
  61152 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u64(uint64x2_t __p0) {
  61153   int16x8_t __ret;
  61154   __ret = (int16x8_t)(__p0);
  61155   return __ret;
  61156 }
  61157 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u16(uint16x8_t __p0) {
  61158   int16x8_t __ret;
  61159   __ret = (int16x8_t)(__p0);
  61160   return __ret;
  61161 }
  61162 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s8(int8x16_t __p0) {
  61163   int16x8_t __ret;
  61164   __ret = (int16x8_t)(__p0);
  61165   return __ret;
  61166 }
  61167 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f64(float64x2_t __p0) {
  61168   int16x8_t __ret;
  61169   __ret = (int16x8_t)(__p0);
  61170   return __ret;
  61171 }
  61172 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f32(float32x4_t __p0) {
  61173   int16x8_t __ret;
  61174   __ret = (int16x8_t)(__p0);
  61175   return __ret;
  61176 }
  61177 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f16(float16x8_t __p0) {
  61178   int16x8_t __ret;
  61179   __ret = (int16x8_t)(__p0);
  61180   return __ret;
  61181 }
  61182 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s32(int32x4_t __p0) {
  61183   int16x8_t __ret;
  61184   __ret = (int16x8_t)(__p0);
  61185   return __ret;
  61186 }
  61187 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s64(int64x2_t __p0) {
  61188   int16x8_t __ret;
  61189   __ret = (int16x8_t)(__p0);
  61190   return __ret;
  61191 }
  61192 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_mf8(mfloat8x16_t __p0) {
  61193   int16x8_t __ret;
  61194   __ret = (int16x8_t)(__p0);
  61195   return __ret;
  61196 }
  61197 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p8(poly8x8_t __p0) {
  61198   uint8x8_t __ret;
  61199   __ret = (uint8x8_t)(__p0);
  61200   return __ret;
  61201 }
  61202 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p64(poly64x1_t __p0) {
  61203   uint8x8_t __ret;
  61204   __ret = (uint8x8_t)(__p0);
  61205   return __ret;
  61206 }
  61207 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p16(poly16x4_t __p0) {
  61208   uint8x8_t __ret;
  61209   __ret = (uint8x8_t)(__p0);
  61210   return __ret;
  61211 }
  61212 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u32(uint32x2_t __p0) {
  61213   uint8x8_t __ret;
  61214   __ret = (uint8x8_t)(__p0);
  61215   return __ret;
  61216 }
  61217 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u64(uint64x1_t __p0) {
  61218   uint8x8_t __ret;
  61219   __ret = (uint8x8_t)(__p0);
  61220   return __ret;
  61221 }
  61222 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u16(uint16x4_t __p0) {
  61223   uint8x8_t __ret;
  61224   __ret = (uint8x8_t)(__p0);
  61225   return __ret;
  61226 }
  61227 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s8(int8x8_t __p0) {
  61228   uint8x8_t __ret;
  61229   __ret = (uint8x8_t)(__p0);
  61230   return __ret;
  61231 }
  61232 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f64(float64x1_t __p0) {
  61233   uint8x8_t __ret;
  61234   __ret = (uint8x8_t)(__p0);
  61235   return __ret;
  61236 }
  61237 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f32(float32x2_t __p0) {
  61238   uint8x8_t __ret;
  61239   __ret = (uint8x8_t)(__p0);
  61240   return __ret;
  61241 }
  61242 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f16(float16x4_t __p0) {
  61243   uint8x8_t __ret;
  61244   __ret = (uint8x8_t)(__p0);
  61245   return __ret;
  61246 }
  61247 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s32(int32x2_t __p0) {
  61248   uint8x8_t __ret;
  61249   __ret = (uint8x8_t)(__p0);
  61250   return __ret;
  61251 }
  61252 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s64(int64x1_t __p0) {
  61253   uint8x8_t __ret;
  61254   __ret = (uint8x8_t)(__p0);
  61255   return __ret;
  61256 }
  61257 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_mf8(mfloat8x8_t __p0) {
  61258   uint8x8_t __ret;
  61259   __ret = (uint8x8_t)(__p0);
  61260   return __ret;
  61261 }
  61262 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s16(int16x4_t __p0) {
  61263   uint8x8_t __ret;
  61264   __ret = (uint8x8_t)(__p0);
  61265   return __ret;
  61266 }
  61267 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p8(poly8x8_t __p0) {
  61268   uint32x2_t __ret;
  61269   __ret = (uint32x2_t)(__p0);
  61270   return __ret;
  61271 }
  61272 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p64(poly64x1_t __p0) {
  61273   uint32x2_t __ret;
  61274   __ret = (uint32x2_t)(__p0);
  61275   return __ret;
  61276 }
  61277 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p16(poly16x4_t __p0) {
  61278   uint32x2_t __ret;
  61279   __ret = (uint32x2_t)(__p0);
  61280   return __ret;
  61281 }
  61282 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u8(uint8x8_t __p0) {
  61283   uint32x2_t __ret;
  61284   __ret = (uint32x2_t)(__p0);
  61285   return __ret;
  61286 }
  61287 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u64(uint64x1_t __p0) {
  61288   uint32x2_t __ret;
  61289   __ret = (uint32x2_t)(__p0);
  61290   return __ret;
  61291 }
  61292 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u16(uint16x4_t __p0) {
  61293   uint32x2_t __ret;
  61294   __ret = (uint32x2_t)(__p0);
  61295   return __ret;
  61296 }
  61297 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s8(int8x8_t __p0) {
  61298   uint32x2_t __ret;
  61299   __ret = (uint32x2_t)(__p0);
  61300   return __ret;
  61301 }
  61302 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f64(float64x1_t __p0) {
  61303   uint32x2_t __ret;
  61304   __ret = (uint32x2_t)(__p0);
  61305   return __ret;
  61306 }
  61307 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f32(float32x2_t __p0) {
  61308   uint32x2_t __ret;
  61309   __ret = (uint32x2_t)(__p0);
  61310   return __ret;
  61311 }
  61312 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f16(float16x4_t __p0) {
  61313   uint32x2_t __ret;
  61314   __ret = (uint32x2_t)(__p0);
  61315   return __ret;
  61316 }
  61317 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s32(int32x2_t __p0) {
  61318   uint32x2_t __ret;
  61319   __ret = (uint32x2_t)(__p0);
  61320   return __ret;
  61321 }
  61322 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s64(int64x1_t __p0) {
  61323   uint32x2_t __ret;
  61324   __ret = (uint32x2_t)(__p0);
  61325   return __ret;
  61326 }
  61327 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_mf8(mfloat8x8_t __p0) {
  61328   uint32x2_t __ret;
  61329   __ret = (uint32x2_t)(__p0);
  61330   return __ret;
  61331 }
  61332 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s16(int16x4_t __p0) {
  61333   uint32x2_t __ret;
  61334   __ret = (uint32x2_t)(__p0);
  61335   return __ret;
  61336 }
  61337 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p8(poly8x8_t __p0) {
  61338   uint64x1_t __ret;
  61339   __ret = (uint64x1_t)(__p0);
  61340   return __ret;
  61341 }
  61342 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p64(poly64x1_t __p0) {
  61343   uint64x1_t __ret;
  61344   __ret = (uint64x1_t)(__p0);
  61345   return __ret;
  61346 }
  61347 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p16(poly16x4_t __p0) {
  61348   /* Vector-cast the poly16x4_t argument to uint64x1_t and return it. */
  61349   uint64x1_t __cast = (uint64x1_t)(__p0);
  61350   return __cast;
  61351 }
  61352 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u8(uint8x8_t __p0) {
  61353   /* Vector-cast the uint8x8_t argument to uint64x1_t and return it. */
  61354   uint64x1_t __cast = (uint64x1_t)(__p0);
  61355   return __cast;
  61356 }
  61357 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u32(uint32x2_t __p0) {
  61358   /* Vector-cast the uint32x2_t argument to uint64x1_t and return it. */
  61359   uint64x1_t __cast = (uint64x1_t)(__p0);
  61360   return __cast;
  61361 }
  61362 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u16(uint16x4_t __p0) {
  61363   /* Vector-cast the uint16x4_t argument to uint64x1_t and return it. */
  61364   uint64x1_t __cast = (uint64x1_t)(__p0);
  61365   return __cast;
  61366 }
  61367 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s8(int8x8_t __p0) {
  61368   /* Vector-cast the int8x8_t argument to uint64x1_t and return it. */
  61369   uint64x1_t __cast = (uint64x1_t)(__p0);
  61370   return __cast;
  61371 }
  61372 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f64(float64x1_t __p0) {
  61373   /* Vector-cast the float64x1_t argument to uint64x1_t and return it. */
  61374   uint64x1_t __cast = (uint64x1_t)(__p0);
  61375   return __cast;
  61376 }
  61377 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f32(float32x2_t __p0) {
  61378   /* Vector-cast the float32x2_t argument to uint64x1_t and return it. */
  61379   uint64x1_t __cast = (uint64x1_t)(__p0);
  61380   return __cast;
  61381 }
  61382 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f16(float16x4_t __p0) {
  61383   /* Vector-cast the float16x4_t argument to uint64x1_t and return it. */
  61384   uint64x1_t __cast = (uint64x1_t)(__p0);
  61385   return __cast;
  61386 }
  61387 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s32(int32x2_t __p0) {
  61388   /* Vector-cast the int32x2_t argument to uint64x1_t and return it. */
  61389   uint64x1_t __cast = (uint64x1_t)(__p0);
  61390   return __cast;
  61391 }
  61392 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s64(int64x1_t __p0) {
  61393   /* Vector-cast the int64x1_t argument to uint64x1_t and return it. */
  61394   uint64x1_t __cast = (uint64x1_t)(__p0);
  61395   return __cast;
  61396 }
  61397 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_mf8(mfloat8x8_t __p0) {
  61398   /* Vector-cast the mfloat8x8_t argument to uint64x1_t and return it. */
  61399   uint64x1_t __cast = (uint64x1_t)(__p0);
  61400   return __cast;
  61401 }
  61402 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s16(int16x4_t __p0) {
  61403   /* Vector-cast the int16x4_t argument to uint64x1_t and return it. */
  61404   uint64x1_t __cast = (uint64x1_t)(__p0);
  61405   return __cast;
  61406 }
  61407 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p8(poly8x8_t __p0) {
  61408   /* Vector-cast the poly8x8_t argument to uint16x4_t and return it. */
  61409   uint16x4_t __cast = (uint16x4_t)(__p0);
  61410   return __cast;
  61411 }
  61412 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p64(poly64x1_t __p0) {
  61413   /* Vector-cast the poly64x1_t argument to uint16x4_t and return it. */
  61414   uint16x4_t __cast = (uint16x4_t)(__p0);
  61415   return __cast;
  61416 }
  61417 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p16(poly16x4_t __p0) {
  61418   /* Vector-cast the poly16x4_t argument to uint16x4_t and return it. */
  61419   uint16x4_t __cast = (uint16x4_t)(__p0);
  61420   return __cast;
  61421 }
  61422 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u8(uint8x8_t __p0) {
  61423   /* Vector-cast the uint8x8_t argument to uint16x4_t and return it. */
  61424   uint16x4_t __cast = (uint16x4_t)(__p0);
  61425   return __cast;
  61426 }
  61427 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u32(uint32x2_t __p0) {
  61428   /* Vector-cast the uint32x2_t argument to uint16x4_t and return it. */
  61429   uint16x4_t __cast = (uint16x4_t)(__p0);
  61430   return __cast;
  61431 }
  61432 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u64(uint64x1_t __p0) {
  61433   /* Vector-cast the uint64x1_t argument to uint16x4_t and return it. */
  61434   uint16x4_t __cast = (uint16x4_t)(__p0);
  61435   return __cast;
  61436 }
  61437 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s8(int8x8_t __p0) {
  61438   /* Vector-cast the int8x8_t argument to uint16x4_t and return it. */
  61439   uint16x4_t __cast = (uint16x4_t)(__p0);
  61440   return __cast;
  61441 }
  61442 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f64(float64x1_t __p0) {
  61443   /* Vector-cast the float64x1_t argument to uint16x4_t and return it. */
  61444   uint16x4_t __cast = (uint16x4_t)(__p0);
  61445   return __cast;
  61446 }
  61447 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f32(float32x2_t __p0) {
  61448   /* Vector-cast the float32x2_t argument to uint16x4_t and return it. */
  61449   uint16x4_t __cast = (uint16x4_t)(__p0);
  61450   return __cast;
  61451 }
  61452 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f16(float16x4_t __p0) {
  61453   /* Vector-cast the float16x4_t argument to uint16x4_t and return it. */
  61454   uint16x4_t __cast = (uint16x4_t)(__p0);
  61455   return __cast;
  61456 }
  61457 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s32(int32x2_t __p0) {
  61458   /* Vector-cast the int32x2_t argument to uint16x4_t and return it. */
  61459   uint16x4_t __cast = (uint16x4_t)(__p0);
  61460   return __cast;
  61461 }
  61462 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s64(int64x1_t __p0) {
  61463   /* Vector-cast the int64x1_t argument to uint16x4_t and return it. */
  61464   uint16x4_t __cast = (uint16x4_t)(__p0);
  61465   return __cast;
  61466 }
  61467 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_mf8(mfloat8x8_t __p0) {
  61468   /* Vector-cast the mfloat8x8_t argument to uint16x4_t and return it. */
  61469   uint16x4_t __cast = (uint16x4_t)(__p0);
  61470   return __cast;
  61471 }
  61472 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s16(int16x4_t __p0) {
  61473   /* Vector-cast the int16x4_t argument to uint16x4_t and return it. */
  61474   uint16x4_t __cast = (uint16x4_t)(__p0);
  61475   return __cast;
  61476 }
  61477 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p8(poly8x8_t __p0) {
  61478   /* Vector-cast the poly8x8_t argument to int8x8_t and return it. */
  61479   int8x8_t __cast = (int8x8_t)(__p0);
  61480   return __cast;
  61481 }
  61482 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p64(poly64x1_t __p0) {
  61483   /* Vector-cast the poly64x1_t argument to int8x8_t and return it. */
  61484   int8x8_t __cast = (int8x8_t)(__p0);
  61485   return __cast;
  61486 }
  61487 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p16(poly16x4_t __p0) {
  61488   /* Vector-cast the poly16x4_t argument to int8x8_t and return it. */
  61489   int8x8_t __cast = (int8x8_t)(__p0);
  61490   return __cast;
  61491 }
  61492 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u8(uint8x8_t __p0) {
  61493   /* Vector-cast the uint8x8_t argument to int8x8_t and return it. */
  61494   int8x8_t __cast = (int8x8_t)(__p0);
  61495   return __cast;
  61496 }
  61497 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u32(uint32x2_t __p0) {
  61498   /* Vector-cast the uint32x2_t argument to int8x8_t and return it. */
  61499   int8x8_t __cast = (int8x8_t)(__p0);
  61500   return __cast;
  61501 }
  61502 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u64(uint64x1_t __p0) {
  61503   /* Vector-cast the uint64x1_t argument to int8x8_t and return it. */
  61504   int8x8_t __cast = (int8x8_t)(__p0);
  61505   return __cast;
  61506 }
  61507 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u16(uint16x4_t __p0) {
  61508   /* Vector-cast the uint16x4_t argument to int8x8_t and return it. */
  61509   int8x8_t __cast = (int8x8_t)(__p0);
  61510   return __cast;
  61511 }
  61512 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f64(float64x1_t __p0) {
  61513   /* Vector-cast the float64x1_t argument to int8x8_t and return it. */
  61514   int8x8_t __cast = (int8x8_t)(__p0);
  61515   return __cast;
  61516 }
  61517 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f32(float32x2_t __p0) {
  61518   /* Vector-cast the float32x2_t argument to int8x8_t and return it. */
  61519   int8x8_t __cast = (int8x8_t)(__p0);
  61520   return __cast;
  61521 }
  61522 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f16(float16x4_t __p0) {
  61523   /* Vector-cast the float16x4_t argument to int8x8_t and return it. */
  61524   int8x8_t __cast = (int8x8_t)(__p0);
  61525   return __cast;
  61526 }
  61527 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s32(int32x2_t __p0) {
  61528   /* Vector-cast the int32x2_t argument to int8x8_t and return it. */
  61529   int8x8_t __cast = (int8x8_t)(__p0);
  61530   return __cast;
  61531 }
  61532 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s64(int64x1_t __p0) {
  61533   /* Vector-cast the int64x1_t argument to int8x8_t and return it. */
  61534   int8x8_t __cast = (int8x8_t)(__p0);
  61535   return __cast;
  61536 }
  61537 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_mf8(mfloat8x8_t __p0) {
  61538   /* Vector-cast the mfloat8x8_t argument to int8x8_t and return it. */
  61539   int8x8_t __cast = (int8x8_t)(__p0);
  61540   return __cast;
  61541 }
  61542 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s16(int16x4_t __p0) {
  61543   /* Vector-cast the int16x4_t argument to int8x8_t and return it. */
  61544   int8x8_t __cast = (int8x8_t)(__p0);
  61545   return __cast;
  61546 }
  61547 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p8(poly8x8_t __p0) {
  61548   /* Vector-cast the poly8x8_t argument to float64x1_t and return it. */
  61549   float64x1_t __cast = (float64x1_t)(__p0);
  61550   return __cast;
  61551 }
  61552 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p64(poly64x1_t __p0) {
  61553   /* Vector-cast the poly64x1_t argument to float64x1_t and return it. */
  61554   float64x1_t __cast = (float64x1_t)(__p0);
  61555   return __cast;
  61556 }
  61557 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p16(poly16x4_t __p0) {
  61558   /* Vector-cast the poly16x4_t argument to float64x1_t and return it. */
  61559   float64x1_t __cast = (float64x1_t)(__p0);
  61560   return __cast;
  61561 }
  61562 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u8(uint8x8_t __p0) {
  61563   /* Vector-cast the uint8x8_t argument to float64x1_t and return it. */
  61564   float64x1_t __cast = (float64x1_t)(__p0);
  61565   return __cast;
  61566 }
  61567 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u32(uint32x2_t __p0) {
  61568   /* Vector-cast the uint32x2_t argument to float64x1_t and return it. */
  61569   float64x1_t __cast = (float64x1_t)(__p0);
  61570   return __cast;
  61571 }
  61572 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u64(uint64x1_t __p0) {
  61573   /* Vector-cast the uint64x1_t argument to float64x1_t and return it. */
  61574   float64x1_t __cast = (float64x1_t)(__p0);
  61575   return __cast;
  61576 }
  61577 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u16(uint16x4_t __p0) {
  61578   /* Vector-cast the uint16x4_t argument to float64x1_t and return it. */
  61579   float64x1_t __cast = (float64x1_t)(__p0);
  61580   return __cast;
  61581 }
  61582 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s8(int8x8_t __p0) {
  61583   /* Vector-cast the int8x8_t argument to float64x1_t and return it. */
  61584   float64x1_t __cast = (float64x1_t)(__p0);
  61585   return __cast;
  61586 }
  61587 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_f32(float32x2_t __p0) {
  61588   /* Vector-cast the float32x2_t argument to float64x1_t and return it. */
  61589   float64x1_t __cast = (float64x1_t)(__p0);
  61590   return __cast;
  61591 }
  61592 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_f16(float16x4_t __p0) {
  61593   /* Vector-cast the float16x4_t argument to float64x1_t and return it. */
  61594   float64x1_t __cast = (float64x1_t)(__p0);
  61595   return __cast;
  61596 }
  61597 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s32(int32x2_t __p0) {
  61598   /* Vector-cast the int32x2_t argument to float64x1_t and return it. */
  61599   float64x1_t __cast = (float64x1_t)(__p0);
  61600   return __cast;
  61601 }
  61602 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s64(int64x1_t __p0) {
  61603   /* Vector-cast the int64x1_t argument to float64x1_t and return it. */
  61604   float64x1_t __cast = (float64x1_t)(__p0);
  61605   return __cast;
  61606 }
  61607 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_mf8(mfloat8x8_t __p0) {
  61608   /* Vector-cast the mfloat8x8_t argument to float64x1_t and return it. */
  61609   float64x1_t __cast = (float64x1_t)(__p0);
  61610   return __cast;
  61611 }
  61612 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s16(int16x4_t __p0) {
  61613   /* Vector-cast the int16x4_t argument to float64x1_t and return it. */
  61614   float64x1_t __cast = (float64x1_t)(__p0);
  61615   return __cast;
  61616 }
  61617 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p8(poly8x8_t __p0) {
  61618   /* Vector-cast the poly8x8_t argument to float32x2_t and return it. */
  61619   float32x2_t __cast = (float32x2_t)(__p0);
  61620   return __cast;
  61621 }
  61622 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p64(poly64x1_t __p0) {
  61623   /* Vector-cast the poly64x1_t argument to float32x2_t and return it. */
  61624   float32x2_t __cast = (float32x2_t)(__p0);
  61625   return __cast;
  61626 }
  61627 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p16(poly16x4_t __p0) {
  61628   /* Vector-cast the poly16x4_t argument to float32x2_t and return it. */
  61629   float32x2_t __cast = (float32x2_t)(__p0);
  61630   return __cast;
  61631 }
  61632 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u8(uint8x8_t __p0) {
  61633   /* Vector-cast the uint8x8_t argument to float32x2_t and return it. */
  61634   float32x2_t __cast = (float32x2_t)(__p0);
  61635   return __cast;
  61636 }
  61637 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u32(uint32x2_t __p0) {
  61638   /* Vector-cast the uint32x2_t argument to float32x2_t and return it. */
  61639   float32x2_t __cast = (float32x2_t)(__p0);
  61640   return __cast;
  61641 }
  61642 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u64(uint64x1_t __p0) {
  61643   /* Vector-cast the uint64x1_t argument to float32x2_t and return it. */
  61644   float32x2_t __cast = (float32x2_t)(__p0);
  61645   return __cast;
  61646 }
  61647 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u16(uint16x4_t __p0) {
  61648   /* Vector-cast the uint16x4_t argument to float32x2_t and return it. */
  61649   float32x2_t __cast = (float32x2_t)(__p0);
  61650   return __cast;
  61651 }
  61652 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s8(int8x8_t __p0) {
  61653   /* Vector-cast the int8x8_t argument to float32x2_t and return it. */
  61654   float32x2_t __cast = (float32x2_t)(__p0);
  61655   return __cast;
  61656 }
  61657 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f64(float64x1_t __p0) {
  61658   /* Vector-cast the float64x1_t argument to float32x2_t and return it. */
  61659   float32x2_t __cast = (float32x2_t)(__p0);
  61660   return __cast;
  61661 }
  61662 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f16(float16x4_t __p0) {
  61663   /* Vector-cast the float16x4_t argument to float32x2_t and return it. */
  61664   float32x2_t __cast = (float32x2_t)(__p0);
  61665   return __cast;
  61666 }
  61667 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s32(int32x2_t __p0) {
  61668   /* Vector-cast the int32x2_t argument to float32x2_t and return it. */
  61669   float32x2_t __cast = (float32x2_t)(__p0);
  61670   return __cast;
  61671 }
  61672 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s64(int64x1_t __p0) {
  61673   /* Vector-cast the int64x1_t argument to float32x2_t and return it. */
  61674   float32x2_t __cast = (float32x2_t)(__p0);
  61675   return __cast;
  61676 }
  61677 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_mf8(mfloat8x8_t __p0) {
  61678   /* Vector-cast the mfloat8x8_t argument to float32x2_t and return it. */
  61679   float32x2_t __cast = (float32x2_t)(__p0);
  61680   return __cast;
  61681 }
  61682 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s16(int16x4_t __p0) {
  61683   /* Vector-cast the int16x4_t argument to float32x2_t and return it. */
  61684   float32x2_t __cast = (float32x2_t)(__p0);
  61685   return __cast;
  61686 }
  61687 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p8(poly8x8_t __p0) {
  61688   /* Vector-cast the poly8x8_t argument to float16x4_t and return it. */
  61689   float16x4_t __cast = (float16x4_t)(__p0);
  61690   return __cast;
  61691 }
  61692 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p64(poly64x1_t __p0) {
  61693   /* Vector-cast the poly64x1_t argument to float16x4_t and return it. */
  61694   float16x4_t __cast = (float16x4_t)(__p0);
  61695   return __cast;
  61696 }
  61697 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p16(poly16x4_t __p0) {
  61698   /* Vector-cast the poly16x4_t argument to float16x4_t and return it. */
  61699   float16x4_t __cast = (float16x4_t)(__p0);
  61700   return __cast;
  61701 }
  61702 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u8(uint8x8_t __p0) {
  61703   /* Vector-cast the uint8x8_t argument to float16x4_t and return it. */
  61704   float16x4_t __cast = (float16x4_t)(__p0);
  61705   return __cast;
  61706 }
  61707 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u32(uint32x2_t __p0) {
  61708   /* Vector-cast the uint32x2_t argument to float16x4_t and return it. */
  61709   float16x4_t __cast = (float16x4_t)(__p0);
  61710   return __cast;
  61711 }
  61712 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u64(uint64x1_t __p0) {
  61713   /* Vector-cast the uint64x1_t argument to float16x4_t and return it. */
  61714   float16x4_t __cast = (float16x4_t)(__p0);
  61715   return __cast;
  61716 }
  61717 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u16(uint16x4_t __p0) {
  61718   /* Vector-cast the uint16x4_t argument to float16x4_t and return it. */
  61719   float16x4_t __cast = (float16x4_t)(__p0);
  61720   return __cast;
  61721 }
  61722 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s8(int8x8_t __p0) {
  61723   /* Vector-cast the int8x8_t argument to float16x4_t and return it. */
  61724   float16x4_t __cast = (float16x4_t)(__p0);
  61725   return __cast;
  61726 }
  61727 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f64(float64x1_t __p0) {
  61728   /* Vector-cast the float64x1_t argument to float16x4_t and return it. */
  61729   float16x4_t __cast = (float16x4_t)(__p0);
  61730   return __cast;
  61731 }
  61732 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f32(float32x2_t __p0) {
  61733   /* Vector-cast the float32x2_t argument to float16x4_t and return it. */
  61734   float16x4_t __cast = (float16x4_t)(__p0);
  61735   return __cast;
  61736 }
  61737 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s32(int32x2_t __p0) {
  61738   /* Vector-cast the int32x2_t argument to float16x4_t and return it. */
  61739   float16x4_t __cast = (float16x4_t)(__p0);
  61740   return __cast;
  61741 }
  61742 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s64(int64x1_t __p0) {
  61743   /* Vector-cast the int64x1_t argument to float16x4_t and return it. */
  61744   float16x4_t __cast = (float16x4_t)(__p0);
  61745   return __cast;
  61746 }
  61747 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_mf8(mfloat8x8_t __p0) {
  61748   /* Vector-cast the mfloat8x8_t argument to float16x4_t and return it. */
  61749   float16x4_t __cast = (float16x4_t)(__p0);
  61750   return __cast;
  61751 }
  61752 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s16(int16x4_t __p0) {
  61753   /* Vector-cast the int16x4_t argument to float16x4_t and return it. */
  61754   float16x4_t __cast = (float16x4_t)(__p0);
  61755   return __cast;
  61756 }
  61757 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p8(poly8x8_t __p0) {
  61758   /* Vector-cast the poly8x8_t argument to int32x2_t and return it. */
  61759   int32x2_t __cast = (int32x2_t)(__p0);
  61760   return __cast;
  61761 }
  61762 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p64(poly64x1_t __p0) {
  61763   /* Vector-cast the poly64x1_t argument to int32x2_t and return it. */
  61764   int32x2_t __cast = (int32x2_t)(__p0);
  61765   return __cast;
  61766 }
  61767 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p16(poly16x4_t __p0) {
  61768   /* Vector-cast the poly16x4_t argument to int32x2_t and return it. */
  61769   int32x2_t __cast = (int32x2_t)(__p0);
  61770   return __cast;
  61771 }
  61772 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u8(uint8x8_t __p0) {
  61773   /* Vector-cast the uint8x8_t argument to int32x2_t and return it. */
  61774   int32x2_t __cast = (int32x2_t)(__p0);
  61775   return __cast;
  61776 }
  61777 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u32(uint32x2_t __p0) {
  61778   /* Vector-cast the uint32x2_t argument to int32x2_t and return it. */
  61779   int32x2_t __cast = (int32x2_t)(__p0);
  61780   return __cast;
  61781 }
  61782 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u64(uint64x1_t __p0) {
  61783   /* Vector-cast the uint64x1_t argument to int32x2_t and return it. */
  61784   int32x2_t __cast = (int32x2_t)(__p0);
  61785   return __cast;
  61786 }
  61787 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u16(uint16x4_t __p0) {
  61788   /* Vector-cast the uint16x4_t argument to int32x2_t and return it. */
  61789   int32x2_t __cast = (int32x2_t)(__p0);
  61790   return __cast;
  61791 }
  61792 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s8(int8x8_t __p0) {
  61793   /* Vector-cast the int8x8_t argument to int32x2_t and return it. */
  61794   int32x2_t __cast = (int32x2_t)(__p0);
  61795   return __cast;
  61796 }
  61797 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f64(float64x1_t __p0) {
  61798   /* Vector-cast the float64x1_t argument to int32x2_t and return it. */
  61799   int32x2_t __cast = (int32x2_t)(__p0);
  61800   return __cast;
  61801 }
  61802 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f32(float32x2_t __p0) {
  61803   /* Vector-cast the float32x2_t argument to int32x2_t and return it. */
  61804   int32x2_t __cast = (int32x2_t)(__p0);
  61805   return __cast;
  61806 }
  61807 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f16(float16x4_t __p0) {
  61808   /* Vector-cast the float16x4_t argument to int32x2_t and return it. */
  61809   int32x2_t __cast = (int32x2_t)(__p0);
  61810   return __cast;
  61811 }
  61812 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s64(int64x1_t __p0) {
  61813   /* Vector-cast the int64x1_t argument to int32x2_t and return it. */
  61814   int32x2_t __cast = (int32x2_t)(__p0);
  61815   return __cast;
  61816 }
  61817 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_mf8(mfloat8x8_t __p0) {
  61818   /* Vector-cast the mfloat8x8_t argument to int32x2_t and return it. */
  61819   int32x2_t __cast = (int32x2_t)(__p0);
  61820   return __cast;
  61821 }
  61822 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s16(int16x4_t __p0) {
  61823   /* Vector-cast the int16x4_t argument to int32x2_t and return it. */
  61824   int32x2_t __cast = (int32x2_t)(__p0);
  61825   return __cast;
  61826 }
  61827 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p8(poly8x8_t __p0) {
  61828   /* Vector-cast the poly8x8_t argument to int64x1_t and return it. */
  61829   int64x1_t __cast = (int64x1_t)(__p0);
  61830   return __cast;
  61831 }
  61832 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p64(poly64x1_t __p0) {
  61833   /* Vector-cast the poly64x1_t argument to int64x1_t and return it. */
  61834   int64x1_t __cast = (int64x1_t)(__p0);
  61835   return __cast;
  61836 }
  61837 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p16(poly16x4_t __p0) {
  61838   /* Vector-cast the poly16x4_t argument to int64x1_t and return it. */
  61839   int64x1_t __cast = (int64x1_t)(__p0);
  61840   return __cast;
  61841 }
  61842 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u8(uint8x8_t __p0) {
  61843   /* Vector-cast the uint8x8_t argument to int64x1_t and return it. */
  61844   int64x1_t __cast = (int64x1_t)(__p0);
  61845   return __cast;
  61846 }
  61847 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u32(uint32x2_t __p0) {
  61848   /* Vector-cast the uint32x2_t argument to int64x1_t and return it. */
  61849   int64x1_t __cast = (int64x1_t)(__p0);
  61850   return __cast;
  61851 }
  61852 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u64(uint64x1_t __p0) {
  61853   /* Vector-cast the uint64x1_t argument to int64x1_t and return it. */
  61854   int64x1_t __cast = (int64x1_t)(__p0);
  61855   return __cast;
  61856 }
  61857 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u16(uint16x4_t __p0) {
  61858   /* Vector-cast the uint16x4_t argument to int64x1_t and return it. */
  61859   int64x1_t __cast = (int64x1_t)(__p0);
  61860   return __cast;
  61861 }
  61862 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s8(int8x8_t __p0) {
  61863   /* Vector-cast the int8x8_t argument to int64x1_t and return it. */
  61864   int64x1_t __cast = (int64x1_t)(__p0);
  61865   return __cast;
  61866 }
  61867 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f64(float64x1_t __p0) {
  61868   /* Vector-cast the float64x1_t argument to int64x1_t and return it. */
  61869   int64x1_t __cast = (int64x1_t)(__p0);
  61870   return __cast;
  61871 }
  61872 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f32(float32x2_t __p0) {
  61873   /* Vector-cast the float32x2_t argument to int64x1_t and return it. */
  61874   int64x1_t __cast = (int64x1_t)(__p0);
  61875   return __cast;
  61876 }
  61877 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f16(float16x4_t __p0) {
  61878   /* Vector-cast the float16x4_t argument to int64x1_t and return it. */
  61879   int64x1_t __cast = (int64x1_t)(__p0);
  61880   return __cast;
  61881 }
  61882 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s32(int32x2_t __p0) {
  61883   /* Vector-cast the int32x2_t argument to int64x1_t and return it. */
  61884   int64x1_t __cast = (int64x1_t)(__p0);
  61885   return __cast;
  61886 }
  61887 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_mf8(mfloat8x8_t __p0) {
  61888   /* Vector-cast the mfloat8x8_t argument to int64x1_t and return it. */
  61889   int64x1_t __cast = (int64x1_t)(__p0);
  61890   return __cast;
  61891 }
  61892 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s16(int16x4_t __p0) {
  61893   /* Vector-cast the int16x4_t argument to int64x1_t and return it. */
  61894   int64x1_t __cast = (int64x1_t)(__p0);
  61895   return __cast;
  61896 }
  61897 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_p8(poly8x8_t __p0) {
  61898   /* Vector-cast the poly8x8_t argument to mfloat8x8_t and return it. */
  61899   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61900   return __cast;
  61901 }
  61902 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_p64(poly64x1_t __p0) {
  61903   /* Vector-cast the poly64x1_t argument to mfloat8x8_t and return it. */
  61904   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61905   return __cast;
  61906 }
  61907 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_p16(poly16x4_t __p0) {
  61908   /* Vector-cast the poly16x4_t argument to mfloat8x8_t and return it. */
  61909   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61910   return __cast;
  61911 }
  61912 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u8(uint8x8_t __p0) {
  61913   /* Vector-cast the uint8x8_t argument to mfloat8x8_t and return it. */
  61914   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61915   return __cast;
  61916 }
  61917 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u32(uint32x2_t __p0) {
  61918   /* Vector-cast the uint32x2_t argument to mfloat8x8_t and return it. */
  61919   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61920   return __cast;
  61921 }
  61922 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u64(uint64x1_t __p0) {
  61923   /* Vector-cast the uint64x1_t argument to mfloat8x8_t and return it. */
  61924   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61925   return __cast;
  61926 }
  61927 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u16(uint16x4_t __p0) {
  61928   /* Vector-cast the uint16x4_t argument to mfloat8x8_t and return it. */
  61929   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61930   return __cast;
  61931 }
  61932 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s8(int8x8_t __p0) {
  61933   /* Vector-cast the int8x8_t argument to mfloat8x8_t and return it. */
  61934   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61935   return __cast;
  61936 }
  61937 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f64(float64x1_t __p0) {
  61938   /* Vector-cast the float64x1_t argument to mfloat8x8_t and return it. */
  61939   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61940   return __cast;
  61941 }
  61942 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f32(float32x2_t __p0) {
  61943   /* Vector-cast the float32x2_t argument to mfloat8x8_t and return it. */
  61944   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61945   return __cast;
  61946 }
  61947 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f16(float16x4_t __p0) {
  61948   /* Vector-cast the float16x4_t argument to mfloat8x8_t and return it. */
  61949   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61950   return __cast;
  61951 }
  61952 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s32(int32x2_t __p0) {
  61953   /* Vector-cast the int32x2_t argument to mfloat8x8_t and return it. */
  61954   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61955   return __cast;
  61956 }
  61957 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s64(int64x1_t __p0) {
  61958   /* Vector-cast the int64x1_t argument to mfloat8x8_t and return it. */
  61959   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61960   return __cast;
  61961 }
  61962 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s16(int16x4_t __p0) {
  61963   /* Vector-cast the int16x4_t argument to mfloat8x8_t and return it. */
  61964   mfloat8x8_t __cast = (mfloat8x8_t)(__p0);
  61965   return __cast;
  61966 }
  61967 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p8(poly8x8_t __p0) {
  61968   /* Vector-cast the poly8x8_t argument to int16x4_t and return it. */
  61969   int16x4_t __cast = (int16x4_t)(__p0);
  61970   return __cast;
  61971 }
  61972 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p64(poly64x1_t __p0) {
  61973   /* Vector-cast the poly64x1_t argument to int16x4_t and return it. */
  61974   int16x4_t __cast = (int16x4_t)(__p0);
  61975   return __cast;
  61976 }
  61977 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p16(poly16x4_t __p0) {
  61978   /* Vector-cast the poly16x4_t argument to int16x4_t and return it. */
  61979   int16x4_t __cast = (int16x4_t)(__p0);
  61980   return __cast;
  61981 }
  61982 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u8(uint8x8_t __p0) {
  61983   /* Vector-cast the uint8x8_t argument to int16x4_t and return it. */
  61984   int16x4_t __cast = (int16x4_t)(__p0);
  61985   return __cast;
  61986 }
  61987 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u32(uint32x2_t __p0) {
  61988   /* Vector-cast the uint32x2_t argument to int16x4_t and return it. */
  61989   int16x4_t __cast = (int16x4_t)(__p0);
  61990   return __cast;
  61991 }
  61992 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u64(uint64x1_t __p0) {
  61993   /* Vector-cast the uint64x1_t argument to int16x4_t and return it. */
  61994   int16x4_t __cast = (int16x4_t)(__p0);
  61995   return __cast;
  61996 }
  61997 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u16(uint16x4_t __p0) {
  61998   /* Vector-cast the uint16x4_t argument to int16x4_t and return it. */
  61999   int16x4_t __cast = (int16x4_t)(__p0);
  62000   return __cast;
  62001 }
  62002 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s8(int8x8_t __p0) {
  62003   /* Vector-cast the int8x8_t argument to int16x4_t and return it. */
  62004   int16x4_t __cast = (int16x4_t)(__p0);
  62005   return __cast;
  62006 }
  62007 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f64(float64x1_t __p0) {
  62008   /* Vector-cast the float64x1_t argument to int16x4_t and return it. */
  62009   int16x4_t __cast = (int16x4_t)(__p0);
  62010   return __cast;
  62011 }
  62012 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f32(float32x2_t __p0) {
  62013   /* Vector-cast the float32x2_t argument to int16x4_t and return it. */
  62014   int16x4_t __cast = (int16x4_t)(__p0);
  62015   return __cast;
  62016 }
  62017 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f16(float16x4_t __p0) {
  62018   /* Vector-cast the float16x4_t argument to int16x4_t and return it. */
  62019   int16x4_t __cast = (int16x4_t)(__p0);
  62020   return __cast;
  62021 }
  62022 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s32(int32x2_t __p0) {
  62023   /* Vector-cast the int32x2_t argument to int16x4_t and return it. */
  62024   int16x4_t __cast = (int16x4_t)(__p0);
  62025   return __cast;
  62026 }
  62027 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s64(int64x1_t __p0) {
  62028   /* Vector-cast the int64x1_t argument to int16x4_t and return it. */
  62029   int16x4_t __cast = (int16x4_t)(__p0);
  62030   return __cast;
  62031 }
  62032 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_mf8(mfloat8x8_t __p0) {
  62033   /* Vector-cast the mfloat8x8_t argument to int16x4_t and return it. */
  62034   int16x4_t __cast = (int16x4_t)(__p0);
  62035   return __cast;
  62036 }
  62037 __ai __attribute__((target("neon"))) uint64_t vrshld_u64(uint64_t __p0, int64_t __p1) {
  62038   /* Forward both scalar operands to __builtin_neon_vrshld_u64; the result is cast to uint64_t. */
  62039   uint64_t __res = (uint64_t) __builtin_neon_vrshld_u64(__p0, __p1);
  62040   return __res;
  62041 }
  62042 __ai __attribute__((target("neon"))) int64_t vrshld_s64(int64_t __p0, int64_t __p1) {
  62043   /* Forward both scalar operands to __builtin_neon_vrshld_s64; the result is cast to int64_t. */
  62044   int64_t __res = (int64_t) __builtin_neon_vrshld_s64(__p0, __p1);
  62045   return __res;
  62046 }
  62047 #define vrshrd_n_u64(__p0, __p1) __extension__ ({ /* statement expression; its value is the final __ret */ \
  62048   uint64_t __ret; \
  62049   uint64_t __s0 = __p0; /* typed uint64_t copy of the first argument */ \
  62050   __ret = (uint64_t) __builtin_neon_vrshrd_n_u64(__s0, __p1); /* __p1 is forwarded to the builtin as written */ \
  62051   __ret; \
  62052 })
  62053 #define vrshrd_n_s64(__p0, __p1) __extension__ ({ /* statement expression; its value is the final __ret */ \
  62054   int64_t __ret; \
  62055   int64_t __s0 = __p0; /* typed int64_t copy of the first argument */ \
  62056   __ret = (int64_t) __builtin_neon_vrshrd_n_s64(__s0, __p1); /* __p1 is forwarded to the builtin as written */ \
  62057   __ret; \
  62058 })
  62059 #ifdef __LITTLE_ENDIAN__
  62060 #define vrshrn_high_n_u32(__p0_724, __p1_724, __p2_724) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is defined */ \
  62061   uint16x8_t __ret_724; \
  62062   uint16x4_t __s0_724 = __p0_724; /* typed copies of the two vector arguments */ \
  62063   uint32x4_t __s1_724 = __p1_724; \
  62064   __ret_724 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_724), (uint16x4_t)(vrshrn_n_u32(__s1_724, __p2_724)))); /* vcombine_u16(first argument, vrshrn_n_u32(second argument, __p2_724)) */ \
  62065   __ret_724; /* value of the statement expression */ \
  62066 })
  62067 #else
  62068 #define vrshrn_high_n_u32(__p0_725, __p1_725, __p2_725) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is not defined */ \
  62069   uint16x8_t __ret_725; \
  62070   uint16x4_t __s0_725 = __p0_725; \
  62071   uint32x4_t __s1_725 = __p1_725; \
  62072   uint16x4_t __rev0_725;  __rev0_725 = __builtin_shufflevector(__s0_725, __s0_725, 3, 2, 1, 0); /* first vector with its 4 lanes in reverse order */ \
  62073   uint32x4_t __rev1_725;  __rev1_725 = __builtin_shufflevector(__s1_725, __s1_725, 3, 2, 1, 0); /* second vector with its 4 lanes in reverse order */ \
  62074   __ret_725 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_725), (uint16x4_t)(__noswap_vrshrn_n_u32(__rev1_725, __p2_725)))); /* same combine as the other variant, via the __noswap_ helpers on the reversed inputs */ \
  62075   __ret_725 = __builtin_shufflevector(__ret_725, __ret_725, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the 8 result lanes */ \
  62076   __ret_725; \
  62077 })
  62078 #endif
  62079 
  62080 #ifdef __LITTLE_ENDIAN__
  62081 #define vrshrn_high_n_u64(__p0_726, __p1_726, __p2_726) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is defined */ \
  62082   uint32x4_t __ret_726; \
  62083   uint32x2_t __s0_726 = __p0_726; /* typed copies of the two vector arguments */ \
  62084   uint64x2_t __s1_726 = __p1_726; \
  62085   __ret_726 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_726), (uint32x2_t)(vrshrn_n_u64(__s1_726, __p2_726)))); /* vcombine_u32(first argument, vrshrn_n_u64(second argument, __p2_726)) */ \
  62086   __ret_726; /* value of the statement expression */ \
  62087 })
  62088 #else
  62089 #define vrshrn_high_n_u64(__p0_727, __p1_727, __p2_727) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is not defined */ \
  62090   uint32x4_t __ret_727; \
  62091   uint32x2_t __s0_727 = __p0_727; \
  62092   uint64x2_t __s1_727 = __p1_727; \
  62093   uint32x2_t __rev0_727;  __rev0_727 = __builtin_shufflevector(__s0_727, __s0_727, 1, 0); /* first vector with its 2 lanes swapped */ \
  62094   uint64x2_t __rev1_727;  __rev1_727 = __builtin_shufflevector(__s1_727, __s1_727, 1, 0); /* second vector with its 2 lanes swapped */ \
  62095   __ret_727 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_727), (uint32x2_t)(__noswap_vrshrn_n_u64(__rev1_727, __p2_727)))); /* same combine as the other variant, via the __noswap_ helpers on the reversed inputs */ \
  62096   __ret_727 = __builtin_shufflevector(__ret_727, __ret_727, 3, 2, 1, 0); /* reverse the 4 result lanes */ \
  62097   __ret_727; \
  62098 })
  62099 #endif
  62100 
  62101 #ifdef __LITTLE_ENDIAN__
  62102 #define vrshrn_high_n_u16(__p0_728, __p1_728, __p2_728) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is defined */ \
  62103   uint8x16_t __ret_728; \
  62104   uint8x8_t __s0_728 = __p0_728; /* typed copies of the two vector arguments */ \
  62105   uint16x8_t __s1_728 = __p1_728; \
  62106   __ret_728 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_728), (uint8x8_t)(vrshrn_n_u16(__s1_728, __p2_728)))); /* vcombine_u8(first argument, vrshrn_n_u16(second argument, __p2_728)) */ \
  62107   __ret_728; /* value of the statement expression */ \
  62108 })
  62109 #else
  62110 #define vrshrn_high_n_u16(__p0_729, __p1_729, __p2_729) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is not defined */ \
  62111   uint8x16_t __ret_729; \
  62112   uint8x8_t __s0_729 = __p0_729; \
  62113   uint16x8_t __s1_729 = __p1_729; \
  62114   uint8x8_t __rev0_729;  __rev0_729 = __builtin_shufflevector(__s0_729, __s0_729, 7, 6, 5, 4, 3, 2, 1, 0); /* first vector with its 8 lanes in reverse order */ \
  62115   uint16x8_t __rev1_729;  __rev1_729 = __builtin_shufflevector(__s1_729, __s1_729, 7, 6, 5, 4, 3, 2, 1, 0); /* second vector with its 8 lanes in reverse order */ \
  62116   __ret_729 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_729), (uint8x8_t)(__noswap_vrshrn_n_u16(__rev1_729, __p2_729)))); /* same combine as the other variant, via the __noswap_ helpers on the reversed inputs */ \
  62117   __ret_729 = __builtin_shufflevector(__ret_729, __ret_729, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the 16 result lanes */ \
  62118   __ret_729; \
  62119 })
  62120 #endif
  62121 
  62122 #ifdef __LITTLE_ENDIAN__
  62123 #define vrshrn_high_n_s32(__p0_730, __p1_730, __p2_730) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is defined */ \
  62124   int16x8_t __ret_730; \
  62125   int16x4_t __s0_730 = __p0_730; /* typed copies of the two vector arguments */ \
  62126   int32x4_t __s1_730 = __p1_730; \
  62127   __ret_730 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_730), (int16x4_t)(vrshrn_n_s32(__s1_730, __p2_730)))); /* vcombine_s16(first argument, vrshrn_n_s32(second argument, __p2_730)) */ \
  62128   __ret_730; /* value of the statement expression */ \
  62129 })
  62130 #else
  62131 #define vrshrn_high_n_s32(__p0_731, __p1_731, __p2_731) __extension__ ({ /* variant compiled when __LITTLE_ENDIAN__ is not defined */ \
  62132   int16x8_t __ret_731; \
  62133   int16x4_t __s0_731 = __p0_731; \
  62134   int32x4_t __s1_731 = __p1_731; \
  62135   int16x4_t __rev0_731;  __rev0_731 = __builtin_shufflevector(__s0_731, __s0_731, 3, 2, 1, 0); /* first vector with its 4 lanes in reverse order */ \
  62136   int32x4_t __rev1_731;  __rev1_731 = __builtin_shufflevector(__s1_731, __s1_731, 3, 2, 1, 0); /* second vector with its 4 lanes in reverse order */ \
  62137   __ret_731 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_731), (int16x4_t)(__noswap_vrshrn_n_s32(__rev1_731, __p2_731)))); /* same combine as the other variant, via the __noswap_ helpers on the reversed inputs */ \
  62138   __ret_731 = __builtin_shufflevector(__ret_731, __ret_731, 7, 6, 5, 4, 3, 2, 1, 0); /* reverse the 8 result lanes */ \
  62139   __ret_731; \
  62140 })
  62141 #endif
  62142 
  /*
   * vrshrn_high_n_s64(a, b, n): statement-expression macro yielding an
   * int32x4_t.  The int32x2_t first argument is passed as the first operand
   * of vcombine_s32 and vrshrn_n_s64(b, n) (b is an int64x2_t) as the second.
   * n is forwarded textually to vrshrn_n_s64.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * combined result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62143 #ifdef __LITTLE_ENDIAN__
  62144 #define vrshrn_high_n_s64(__p0_732, __p1_732, __p2_732) __extension__ ({ \
  62145   int32x4_t __ret_732; \
  62146   int32x2_t __s0_732 = __p0_732; \
  62147   int64x2_t __s1_732 = __p1_732; \
  62148   __ret_732 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_732), (int32x2_t)(vrshrn_n_s64(__s1_732, __p2_732)))); \
  62149   __ret_732; \
  62150 })
  62151 #else
  62152 #define vrshrn_high_n_s64(__p0_733, __p1_733, __p2_733) __extension__ ({ \
  62153   int32x4_t __ret_733; \
  62154   int32x2_t __s0_733 = __p0_733; \
  62155   int64x2_t __s1_733 = __p1_733; \
  62156   int32x2_t __rev0_733;  __rev0_733 = __builtin_shufflevector(__s0_733, __s0_733, 1, 0); \
  62157   int64x2_t __rev1_733;  __rev1_733 = __builtin_shufflevector(__s1_733, __s1_733, 1, 0); \
  62158   __ret_733 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_733), (int32x2_t)(__noswap_vrshrn_n_s64(__rev1_733, __p2_733)))); \
  62159   __ret_733 = __builtin_shufflevector(__ret_733, __ret_733, 3, 2, 1, 0); \
  62160   __ret_733; \
  62161 })
  62162 #endif
  62163 
  /*
   * vrshrn_high_n_s16(a, b, n): statement-expression macro yielding an
   * int8x16_t.  The int8x8_t first argument is passed as the first operand
   * of vcombine_s8 and vrshrn_n_s16(b, n) (b is an int16x8_t) as the second.
   * n is forwarded textually to vrshrn_n_s16.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 16-lane result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62164 #ifdef __LITTLE_ENDIAN__
  62165 #define vrshrn_high_n_s16(__p0_734, __p1_734, __p2_734) __extension__ ({ \
  62166   int8x16_t __ret_734; \
  62167   int8x8_t __s0_734 = __p0_734; \
  62168   int16x8_t __s1_734 = __p1_734; \
  62169   __ret_734 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_734), (int8x8_t)(vrshrn_n_s16(__s1_734, __p2_734)))); \
  62170   __ret_734; \
  62171 })
  62172 #else
  62173 #define vrshrn_high_n_s16(__p0_735, __p1_735, __p2_735) __extension__ ({ \
  62174   int8x16_t __ret_735; \
  62175   int8x8_t __s0_735 = __p0_735; \
  62176   int16x8_t __s1_735 = __p1_735; \
  62177   int8x8_t __rev0_735;  __rev0_735 = __builtin_shufflevector(__s0_735, __s0_735, 7, 6, 5, 4, 3, 2, 1, 0); \
  62178   int16x8_t __rev1_735;  __rev1_735 = __builtin_shufflevector(__s1_735, __s1_735, 7, 6, 5, 4, 3, 2, 1, 0); \
  62179   __ret_735 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_735), (int8x8_t)(__noswap_vrshrn_n_s16(__rev1_735, __p2_735)))); \
  62180   __ret_735 = __builtin_shufflevector(__ret_735, __ret_735, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  62181   __ret_735; \
  62182 })
  62183 #endif
  62184 
  /*
   * vrsqrteq_f64: passes __p0, reinterpreted as int8x16_t, to
   * __builtin_neon_vrsqrteq_v together with the constant 42 and returns the
   * result as float64x2_t.
   *
   * Without __LITTLE_ENDIAN__, the two lanes of the input are swapped before
   * the builtin call and the two lanes of the result are swapped after it.
   *
   * NOTE(review): 42 is presumably the builtin's type code for float64x2_t
   * -- confirm against the header generator.
   */
  62185 #ifdef __LITTLE_ENDIAN__
  62186 __ai __attribute__((target("neon"))) float64x2_t vrsqrteq_f64(float64x2_t __p0) {
  62187   float64x2_t __ret;
  62188   __ret = (float64x2_t) __builtin_neon_vrsqrteq_v((int8x16_t)__p0, 42);
  62189   return __ret;
  62190 }
  62191 #else
  62192 __ai __attribute__((target("neon"))) float64x2_t vrsqrteq_f64(float64x2_t __p0) {
  62193   float64x2_t __ret;
  62194   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62195   __ret = (float64x2_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 42);
  62196   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62197   return __ret;
  62198 }
  62199 #endif
  62200 
  /*
   * vrsqrte_f64: passes __p0, reinterpreted as int8x8_t, to
   * __builtin_neon_vrsqrte_v together with the constant 10 and returns the
   * result as float64x1_t.  There is no endian-specific variant.
   * NOTE(review): 10 is presumably the builtin's type code for float64x1_t
   * -- confirm against the header generator.
   */
  62201 __ai __attribute__((target("neon"))) float64x1_t vrsqrte_f64(float64x1_t __p0) {
  62202   float64x1_t __ret;
  62203   __ret = (float64x1_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 10);
  62204   return __ret;
  62205 }
  /* vrsqrted_f64: returns __builtin_neon_vrsqrted_f64(__p0) as a float64_t. */
  62206 __ai __attribute__((target("neon"))) float64_t vrsqrted_f64(float64_t __p0) {
  62207   float64_t __ret;
  62208   __ret = (float64_t) __builtin_neon_vrsqrted_f64(__p0);
  62209   return __ret;
  62210 }
  /* vrsqrtes_f32: returns __builtin_neon_vrsqrtes_f32(__p0) as a float32_t. */
  62211 __ai __attribute__((target("neon"))) float32_t vrsqrtes_f32(float32_t __p0) {
  62212   float32_t __ret;
  62213   __ret = (float32_t) __builtin_neon_vrsqrtes_f32(__p0);
  62214   return __ret;
  62215 }
  /*
   * vrsqrtsq_f64: passes __p0 and __p1, each reinterpreted as int8x16_t, to
   * __builtin_neon_vrsqrtsq_v together with the constant 42 and returns the
   * result as float64x2_t.
   *
   * Without __LITTLE_ENDIAN__, the two lanes of each input are swapped before
   * the builtin call and the two lanes of the result are swapped after it.
   *
   * NOTE(review): 42 is presumably the builtin's type code for float64x2_t
   * -- confirm against the header generator.
   */
  62216 #ifdef __LITTLE_ENDIAN__
  62217 __ai __attribute__((target("neon"))) float64x2_t vrsqrtsq_f64(float64x2_t __p0, float64x2_t __p1) {
  62218   float64x2_t __ret;
  62219   __ret = (float64x2_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__p0, (int8x16_t)__p1, 42);
  62220   return __ret;
  62221 }
  62222 #else
  62223 __ai __attribute__((target("neon"))) float64x2_t vrsqrtsq_f64(float64x2_t __p0, float64x2_t __p1) {
  62224   float64x2_t __ret;
  62225   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62226   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  62227   __ret = (float64x2_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  62228   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62229   return __ret;
  62230 }
  62231 #endif
  62232 
  /*
   * vrsqrts_f64: passes __p0 and __p1, each reinterpreted as int8x8_t, to
   * __builtin_neon_vrsqrts_v together with the constant 10 and returns the
   * result as float64x1_t.  There is no endian-specific variant.
   * NOTE(review): 10 is presumably the builtin's type code for float64x1_t
   * -- confirm against the header generator.
   */
  62233 __ai __attribute__((target("neon"))) float64x1_t vrsqrts_f64(float64x1_t __p0, float64x1_t __p1) {
  62234   float64x1_t __ret;
  62235   __ret = (float64x1_t) __builtin_neon_vrsqrts_v((int8x8_t)__p0, (int8x8_t)__p1, 10);
  62236   return __ret;
  62237 }
  /* vrsqrtsd_f64: returns __builtin_neon_vrsqrtsd_f64(__p0, __p1) as a float64_t. */
  62238 __ai __attribute__((target("neon"))) float64_t vrsqrtsd_f64(float64_t __p0, float64_t __p1) {
  62239   float64_t __ret;
  62240   __ret = (float64_t) __builtin_neon_vrsqrtsd_f64(__p0, __p1);
  62241   return __ret;
  62242 }
  /* vrsqrtss_f32: returns __builtin_neon_vrsqrtss_f32(__p0, __p1) as a float32_t. */
  62243 __ai __attribute__((target("neon"))) float32_t vrsqrtss_f32(float32_t __p0, float32_t __p1) {
  62244   float32_t __ret;
  62245   __ret = (float32_t) __builtin_neon_vrsqrtss_f32(__p0, __p1);
  62246   return __ret;
  62247 }
  /*
   * vrsrad_n_u64(__p0, __p1, __p2): statement-expression macro yielding a
   * uint64_t.  __p0 and __p1 are first copied into uint64_t locals, so each
   * is evaluated once, and the value is
   * __builtin_neon_vrsrad_n_u64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.
   */
  62248 #define vrsrad_n_u64(__p0, __p1, __p2) __extension__ ({ \
  62249   uint64_t __ret; \
  62250   uint64_t __s0 = __p0; \
  62251   uint64_t __s1 = __p1; \
  62252   __ret = (uint64_t) __builtin_neon_vrsrad_n_u64(__s0, __s1, __p2); \
  62253   __ret; \
  62254 })
  /*
   * vrsrad_n_s64(__p0, __p1, __p2): statement-expression macro yielding an
   * int64_t.  __p0 and __p1 are first copied into int64_t locals, so each is
   * evaluated once, and the value is
   * __builtin_neon_vrsrad_n_s64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.
   */
  62255 #define vrsrad_n_s64(__p0, __p1, __p2) __extension__ ({ \
  62256   int64_t __ret; \
  62257   int64_t __s0 = __p0; \
  62258   int64_t __s1 = __p1; \
  62259   __ret = (int64_t) __builtin_neon_vrsrad_n_s64(__s0, __s1, __p2); \
  62260   __ret; \
  62261 })
  /*
   * vrsubhn_high_u32: returns the uint16x8_t produced by vcombine_u16 with
   * __p0 as its first operand and vrsubhn_u32(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 8-lane result is lane-reversed again before it is returned.
   */
  62262 #ifdef __LITTLE_ENDIAN__
  62263 __ai __attribute__((target("neon"))) uint16x8_t vrsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  62264   uint16x8_t __ret;
  62265   __ret = vcombine_u16(__p0, vrsubhn_u32(__p1, __p2));
  62266   return __ret;
  62267 }
  62268 #else
  62269 __ai __attribute__((target("neon"))) uint16x8_t vrsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  62270   uint16x8_t __ret;
  62271   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  62272   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  62273   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  62274   __ret = __noswap_vcombine_u16(__rev0, __noswap_vrsubhn_u32(__rev1, __rev2));
  62275   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  62276   return __ret;
  62277 }
  62278 #endif
  62279 
  /*
   * vrsubhn_high_u64: returns the uint32x4_t produced by vcombine_u32 with
   * __p0 as its first operand and vrsubhn_u64(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 4-lane result is lane-reversed again before it is returned.
   */
  62280 #ifdef __LITTLE_ENDIAN__
  62281 __ai __attribute__((target("neon"))) uint32x4_t vrsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  62282   uint32x4_t __ret;
  62283   __ret = vcombine_u32(__p0, vrsubhn_u64(__p1, __p2));
  62284   return __ret;
  62285 }
  62286 #else
  62287 __ai __attribute__((target("neon"))) uint32x4_t vrsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  62288   uint32x4_t __ret;
  62289   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62290   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  62291   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  62292   __ret = __noswap_vcombine_u32(__rev0, __noswap_vrsubhn_u64(__rev1, __rev2));
  62293   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  62294   return __ret;
  62295 }
  62296 #endif
  62297 
  /*
   * vrsubhn_high_u16: returns the uint8x16_t produced by vcombine_u8 with
   * __p0 as its first operand and vrsubhn_u16(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 16-lane result is lane-reversed again before it is returned.
   */
  62298 #ifdef __LITTLE_ENDIAN__
  62299 __ai __attribute__((target("neon"))) uint8x16_t vrsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  62300   uint8x16_t __ret;
  62301   __ret = vcombine_u8(__p0, vrsubhn_u16(__p1, __p2));
  62302   return __ret;
  62303 }
  62304 #else
  62305 __ai __attribute__((target("neon"))) uint8x16_t vrsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  62306   uint8x16_t __ret;
  62307   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  62308   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  62309   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  62310   __ret = __noswap_vcombine_u8(__rev0, __noswap_vrsubhn_u16(__rev1, __rev2));
  62311   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  62312   return __ret;
  62313 }
  62314 #endif
  62315 
  /*
   * vrsubhn_high_s32: returns the int16x8_t produced by vcombine_s16 with
   * __p0 as its first operand and vrsubhn_s32(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 8-lane result is lane-reversed again before it is returned.
   */
  62316 #ifdef __LITTLE_ENDIAN__
  62317 __ai __attribute__((target("neon"))) int16x8_t vrsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  62318   int16x8_t __ret;
  62319   __ret = vcombine_s16(__p0, vrsubhn_s32(__p1, __p2));
  62320   return __ret;
  62321 }
  62322 #else
  62323 __ai __attribute__((target("neon"))) int16x8_t vrsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  62324   int16x8_t __ret;
  62325   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  62326   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  62327   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  62328   __ret = __noswap_vcombine_s16(__rev0, __noswap_vrsubhn_s32(__rev1, __rev2));
  62329   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  62330   return __ret;
  62331 }
  62332 #endif
  62333 
  /*
   * vrsubhn_high_s64: returns the int32x4_t produced by vcombine_s32 with
   * __p0 as its first operand and vrsubhn_s64(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 4-lane result is lane-reversed again before it is returned.
   */
  62334 #ifdef __LITTLE_ENDIAN__
  62335 __ai __attribute__((target("neon"))) int32x4_t vrsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  62336   int32x4_t __ret;
  62337   __ret = vcombine_s32(__p0, vrsubhn_s64(__p1, __p2));
  62338   return __ret;
  62339 }
  62340 #else
  62341 __ai __attribute__((target("neon"))) int32x4_t vrsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  62342   int32x4_t __ret;
  62343   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62344   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  62345   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  62346   __ret = __noswap_vcombine_s32(__rev0, __noswap_vrsubhn_s64(__rev1, __rev2));
  62347   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  62348   return __ret;
  62349 }
  62350 #endif
  62351 
  /*
   * vrsubhn_high_s16: returns the int8x16_t produced by vcombine_s8 with
   * __p0 as its first operand and vrsubhn_s16(__p1, __p2) as its second.
   *
   * Without __LITTLE_ENDIAN__, all three inputs are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 16-lane result is lane-reversed again before it is returned.
   */
  62352 #ifdef __LITTLE_ENDIAN__
  62353 __ai __attribute__((target("neon"))) int8x16_t vrsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  62354   int8x16_t __ret;
  62355   __ret = vcombine_s8(__p0, vrsubhn_s16(__p1, __p2));
  62356   return __ret;
  62357 }
  62358 #else
  62359 __ai __attribute__((target("neon"))) int8x16_t vrsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  62360   int8x16_t __ret;
  62361   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  62362   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  62363   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  62364   __ret = __noswap_vcombine_s8(__rev0, __noswap_vrsubhn_s16(__rev1, __rev2));
  62365   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  62366   return __ret;
  62367 }
  62368 #endif
  62369 
  /*
   * vset_lane_p64(__p0, __p1, __p2): statement-expression macro yielding a
   * poly64x1_t.  __p0 is copied into a poly64_t local and __p1 into a
   * poly64x1_t local; the value is
   * __builtin_neon_vset_lane_i64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.  There is no endian-specific variant.
   */
  62370 #define vset_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  62371   poly64x1_t __ret; \
  62372   poly64_t __s0 = __p0; \
  62373   poly64x1_t __s1 = __p1; \
  62374   __ret = (poly64x1_t) __builtin_neon_vset_lane_i64(__s0, (poly64x1_t)__s1, __p2); \
  62375   __ret; \
  62376 })
  /*
   * vsetq_lane_p64(__p0, __p1, __p2): statement-expression macro yielding a
   * poly64x2_t.  __p0 is copied into a poly64_t local and __p1 into a
   * poly64x2_t local; the value comes from
   * __builtin_neon_vsetq_lane_i64(scalar, vector, __p2).  __p2 is substituted
   * textually into the builtin call.
   *
   * Without __LITTLE_ENDIAN__, the vector's two lanes are swapped before the
   * builtin call and the result's two lanes are swapped after it; __p2 is
   * passed through unchanged.  That branch also defines
   * __noswap_vsetq_lane_p64, which calls the builtin with no lane swapping.
   */
  62377 #ifdef __LITTLE_ENDIAN__
  62378 #define vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  62379   poly64x2_t __ret; \
  62380   poly64_t __s0 = __p0; \
  62381   poly64x2_t __s1 = __p1; \
  62382   __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__s1, __p2); \
  62383   __ret; \
  62384 })
  62385 #else
  62386 #define vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  62387   poly64x2_t __ret; \
  62388   poly64_t __s0 = __p0; \
  62389   poly64x2_t __s1 = __p1; \
  62390   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  62391   __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__rev1, __p2); \
  62392   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  62393   __ret; \
  62394 })
  62395 #define __noswap_vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  62396   poly64x2_t __ret; \
  62397   poly64_t __s0 = __p0; \
  62398   poly64x2_t __s1 = __p1; \
  62399   __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__s1, __p2); \
  62400   __ret; \
  62401 })
  62402 #endif
  62403 
  /*
   * vsetq_lane_f64(__p0, __p1, __p2): statement-expression macro yielding a
   * float64x2_t.  __p0 is copied into a float64_t local and __p1 into a
   * float64x2_t local; the value comes from
   * __builtin_neon_vsetq_lane_f64(scalar, vector, __p2).  __p2 is substituted
   * textually into the builtin call.
   *
   * Without __LITTLE_ENDIAN__, the vector's two lanes are swapped before the
   * builtin call and the result's two lanes are swapped after it; __p2 is
   * passed through unchanged.  That branch also defines
   * __noswap_vsetq_lane_f64, which calls the builtin with no lane swapping.
   */
  62404 #ifdef __LITTLE_ENDIAN__
  62405 #define vsetq_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  62406   float64x2_t __ret; \
  62407   float64_t __s0 = __p0; \
  62408   float64x2_t __s1 = __p1; \
  62409   __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__s1, __p2); \
  62410   __ret; \
  62411 })
  62412 #else
  62413 #define vsetq_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  62414   float64x2_t __ret; \
  62415   float64_t __s0 = __p0; \
  62416   float64x2_t __s1 = __p1; \
  62417   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  62418   __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__rev1, __p2); \
  62419   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  62420   __ret; \
  62421 })
  62422 #define __noswap_vsetq_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  62423   float64x2_t __ret; \
  62424   float64_t __s0 = __p0; \
  62425   float64x2_t __s1 = __p1; \
  62426   __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__s1, __p2); \
  62427   __ret; \
  62428 })
  62429 #endif
  62430 
  /*
   * vset_lane_f64(__p0, __p1, __p2): statement-expression macro yielding a
   * float64x1_t.  __p0 is copied into a float64_t local and __p1 into a
   * float64x1_t local; the value is
   * __builtin_neon_vset_lane_f64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.  There is no endian-specific variant.
   */
  62431 #define vset_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  62432   float64x1_t __ret; \
  62433   float64_t __s0 = __p0; \
  62434   float64x1_t __s1 = __p1; \
  62435   __ret = (float64x1_t) __builtin_neon_vset_lane_f64(__s0, (float64x1_t)__s1, __p2); \
  62436   __ret; \
  62437 })
  /*
   * vshld_u64: returns __builtin_neon_vshld_u64(__p0, __p1) as a uint64_t.
   * Note that __p1 is a signed int64_t while __p0 and the result are unsigned.
   */
  62438 __ai __attribute__((target("neon"))) uint64_t vshld_u64(uint64_t __p0, int64_t __p1) {
  62439   uint64_t __ret;
  62440   __ret = (uint64_t) __builtin_neon_vshld_u64(__p0, __p1);
  62441   return __ret;
  62442 }
  /* vshld_s64: returns __builtin_neon_vshld_s64(__p0, __p1) as an int64_t. */
  62443 __ai __attribute__((target("neon"))) int64_t vshld_s64(int64_t __p0, int64_t __p1) {
  62444   int64_t __ret;
  62445   __ret = (int64_t) __builtin_neon_vshld_s64(__p0, __p1);
  62446   return __ret;
  62447 }
  /*
   * vshld_n_u64(__p0, __p1): statement-expression macro yielding a uint64_t.
   * __p0 is copied into a uint64_t local, so it is evaluated once, and the
   * value is __builtin_neon_vshld_n_u64(__s0, __p1).  __p1 is substituted
   * textually into the builtin call.
   */
  62448 #define vshld_n_u64(__p0, __p1) __extension__ ({ \
  62449   uint64_t __ret; \
  62450   uint64_t __s0 = __p0; \
  62451   __ret = (uint64_t) __builtin_neon_vshld_n_u64(__s0, __p1); \
  62452   __ret; \
  62453 })
  /*
   * vshld_n_s64(__p0, __p1): statement-expression macro yielding an int64_t.
   * __p0 is copied into an int64_t local, so it is evaluated once, and the
   * value is __builtin_neon_vshld_n_s64(__s0, __p1).  __p1 is substituted
   * textually into the builtin call.
   */
  62454 #define vshld_n_s64(__p0, __p1) __extension__ ({ \
  62455   int64_t __ret; \
  62456   int64_t __s0 = __p0; \
  62457   __ret = (int64_t) __builtin_neon_vshld_n_s64(__s0, __p1); \
  62458   __ret; \
  62459 })
  /*
   * vshll_high_n_u8(a, n): statement-expression macro yielding a uint16x8_t
   * equal to vshll_n_u8(vget_high_u8(a), n), where a is a uint8x16_t.
   * n is forwarded textually to vshll_n_u8.
   *
   * Without __LITTLE_ENDIAN__, the 16 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 8 result lanes are reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62460 #ifdef __LITTLE_ENDIAN__
  62461 #define vshll_high_n_u8(__p0_736, __p1_736) __extension__ ({ \
  62462   uint16x8_t __ret_736; \
  62463   uint8x16_t __s0_736 = __p0_736; \
  62464   __ret_736 = (uint16x8_t)(vshll_n_u8(vget_high_u8(__s0_736), __p1_736)); \
  62465   __ret_736; \
  62466 })
  62467 #else
  62468 #define vshll_high_n_u8(__p0_737, __p1_737) __extension__ ({ \
  62469   uint16x8_t __ret_737; \
  62470   uint8x16_t __s0_737 = __p0_737; \
  62471   uint8x16_t __rev0_737;  __rev0_737 = __builtin_shufflevector(__s0_737, __s0_737, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  62472   __ret_737 = (uint16x8_t)(__noswap_vshll_n_u8(__noswap_vget_high_u8(__rev0_737), __p1_737)); \
  62473   __ret_737 = __builtin_shufflevector(__ret_737, __ret_737, 7, 6, 5, 4, 3, 2, 1, 0); \
  62474   __ret_737; \
  62475 })
  62476 #endif
  62477 
  /*
   * vshll_high_n_u32(a, n): statement-expression macro yielding a uint64x2_t
   * equal to vshll_n_u32(vget_high_u32(a), n), where a is a uint32x4_t.
   * n is forwarded textually to vshll_n_u32.
   *
   * Without __LITTLE_ENDIAN__, the 4 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 2 result lanes are swapped again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62478 #ifdef __LITTLE_ENDIAN__
  62479 #define vshll_high_n_u32(__p0_738, __p1_738) __extension__ ({ \
  62480   uint64x2_t __ret_738; \
  62481   uint32x4_t __s0_738 = __p0_738; \
  62482   __ret_738 = (uint64x2_t)(vshll_n_u32(vget_high_u32(__s0_738), __p1_738)); \
  62483   __ret_738; \
  62484 })
  62485 #else
  62486 #define vshll_high_n_u32(__p0_739, __p1_739) __extension__ ({ \
  62487   uint64x2_t __ret_739; \
  62488   uint32x4_t __s0_739 = __p0_739; \
  62489   uint32x4_t __rev0_739;  __rev0_739 = __builtin_shufflevector(__s0_739, __s0_739, 3, 2, 1, 0); \
  62490   __ret_739 = (uint64x2_t)(__noswap_vshll_n_u32(__noswap_vget_high_u32(__rev0_739), __p1_739)); \
  62491   __ret_739 = __builtin_shufflevector(__ret_739, __ret_739, 1, 0); \
  62492   __ret_739; \
  62493 })
  62494 #endif
  62495 
  /*
   * vshll_high_n_u16(a, n): statement-expression macro yielding a uint32x4_t
   * equal to vshll_n_u16(vget_high_u16(a), n), where a is a uint16x8_t.
   * n is forwarded textually to vshll_n_u16.
   *
   * Without __LITTLE_ENDIAN__, the 8 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 4 result lanes are reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62496 #ifdef __LITTLE_ENDIAN__
  62497 #define vshll_high_n_u16(__p0_740, __p1_740) __extension__ ({ \
  62498   uint32x4_t __ret_740; \
  62499   uint16x8_t __s0_740 = __p0_740; \
  62500   __ret_740 = (uint32x4_t)(vshll_n_u16(vget_high_u16(__s0_740), __p1_740)); \
  62501   __ret_740; \
  62502 })
  62503 #else
  62504 #define vshll_high_n_u16(__p0_741, __p1_741) __extension__ ({ \
  62505   uint32x4_t __ret_741; \
  62506   uint16x8_t __s0_741 = __p0_741; \
  62507   uint16x8_t __rev0_741;  __rev0_741 = __builtin_shufflevector(__s0_741, __s0_741, 7, 6, 5, 4, 3, 2, 1, 0); \
  62508   __ret_741 = (uint32x4_t)(__noswap_vshll_n_u16(__noswap_vget_high_u16(__rev0_741), __p1_741)); \
  62509   __ret_741 = __builtin_shufflevector(__ret_741, __ret_741, 3, 2, 1, 0); \
  62510   __ret_741; \
  62511 })
  62512 #endif
  62513 
  /*
   * vshll_high_n_s8(a, n): statement-expression macro yielding an int16x8_t
   * equal to vshll_n_s8(vget_high_s8(a), n), where a is an int8x16_t.
   * n is forwarded textually to vshll_n_s8.
   *
   * Without __LITTLE_ENDIAN__, the 16 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 8 result lanes are reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62514 #ifdef __LITTLE_ENDIAN__
  62515 #define vshll_high_n_s8(__p0_742, __p1_742) __extension__ ({ \
  62516   int16x8_t __ret_742; \
  62517   int8x16_t __s0_742 = __p0_742; \
  62518   __ret_742 = (int16x8_t)(vshll_n_s8(vget_high_s8(__s0_742), __p1_742)); \
  62519   __ret_742; \
  62520 })
  62521 #else
  62522 #define vshll_high_n_s8(__p0_743, __p1_743) __extension__ ({ \
  62523   int16x8_t __ret_743; \
  62524   int8x16_t __s0_743 = __p0_743; \
  62525   int8x16_t __rev0_743;  __rev0_743 = __builtin_shufflevector(__s0_743, __s0_743, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  62526   __ret_743 = (int16x8_t)(__noswap_vshll_n_s8(__noswap_vget_high_s8(__rev0_743), __p1_743)); \
  62527   __ret_743 = __builtin_shufflevector(__ret_743, __ret_743, 7, 6, 5, 4, 3, 2, 1, 0); \
  62528   __ret_743; \
  62529 })
  62530 #endif
  62531 
  /*
   * vshll_high_n_s32(a, n): statement-expression macro yielding an int64x2_t
   * equal to vshll_n_s32(vget_high_s32(a), n), where a is an int32x4_t.
   * n is forwarded textually to vshll_n_s32.
   *
   * Without __LITTLE_ENDIAN__, the 4 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 2 result lanes are swapped again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62532 #ifdef __LITTLE_ENDIAN__
  62533 #define vshll_high_n_s32(__p0_744, __p1_744) __extension__ ({ \
  62534   int64x2_t __ret_744; \
  62535   int32x4_t __s0_744 = __p0_744; \
  62536   __ret_744 = (int64x2_t)(vshll_n_s32(vget_high_s32(__s0_744), __p1_744)); \
  62537   __ret_744; \
  62538 })
  62539 #else
  62540 #define vshll_high_n_s32(__p0_745, __p1_745) __extension__ ({ \
  62541   int64x2_t __ret_745; \
  62542   int32x4_t __s0_745 = __p0_745; \
  62543   int32x4_t __rev0_745;  __rev0_745 = __builtin_shufflevector(__s0_745, __s0_745, 3, 2, 1, 0); \
  62544   __ret_745 = (int64x2_t)(__noswap_vshll_n_s32(__noswap_vget_high_s32(__rev0_745), __p1_745)); \
  62545   __ret_745 = __builtin_shufflevector(__ret_745, __ret_745, 1, 0); \
  62546   __ret_745; \
  62547 })
  62548 #endif
  62549 
  /*
   * vshll_high_n_s16(a, n): statement-expression macro yielding an int32x4_t
   * equal to vshll_n_s16(vget_high_s16(a), n), where a is an int16x8_t.
   * n is forwarded textually to vshll_n_s16.
   *
   * Without __LITTLE_ENDIAN__, the 8 input lanes are reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 4 result lanes are reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62550 #ifdef __LITTLE_ENDIAN__
  62551 #define vshll_high_n_s16(__p0_746, __p1_746) __extension__ ({ \
  62552   int32x4_t __ret_746; \
  62553   int16x8_t __s0_746 = __p0_746; \
  62554   __ret_746 = (int32x4_t)(vshll_n_s16(vget_high_s16(__s0_746), __p1_746)); \
  62555   __ret_746; \
  62556 })
  62557 #else
  62558 #define vshll_high_n_s16(__p0_747, __p1_747) __extension__ ({ \
  62559   int32x4_t __ret_747; \
  62560   int16x8_t __s0_747 = __p0_747; \
  62561   int16x8_t __rev0_747;  __rev0_747 = __builtin_shufflevector(__s0_747, __s0_747, 7, 6, 5, 4, 3, 2, 1, 0); \
  62562   __ret_747 = (int32x4_t)(__noswap_vshll_n_s16(__noswap_vget_high_s16(__rev0_747), __p1_747)); \
  62563   __ret_747 = __builtin_shufflevector(__ret_747, __ret_747, 3, 2, 1, 0); \
  62564   __ret_747; \
  62565 })
  62566 #endif
  62567 
  /*
   * vshrd_n_u64(__p0, __p1): statement-expression macro yielding a uint64_t.
   * __p0 is copied into a uint64_t local, so it is evaluated once, and the
   * value is __builtin_neon_vshrd_n_u64(__s0, __p1).  __p1 is substituted
   * textually into the builtin call.
   */
  62568 #define vshrd_n_u64(__p0, __p1) __extension__ ({ \
  62569   uint64_t __ret; \
  62570   uint64_t __s0 = __p0; \
  62571   __ret = (uint64_t) __builtin_neon_vshrd_n_u64(__s0, __p1); \
  62572   __ret; \
  62573 })
  /*
   * vshrd_n_s64(__p0, __p1): statement-expression macro yielding an int64_t.
   * __p0 is copied into an int64_t local, so it is evaluated once, and the
   * value is __builtin_neon_vshrd_n_s64(__s0, __p1).  __p1 is substituted
   * textually into the builtin call.
   */
  62574 #define vshrd_n_s64(__p0, __p1) __extension__ ({ \
  62575   int64_t __ret; \
  62576   int64_t __s0 = __p0; \
  62577   __ret = (int64_t) __builtin_neon_vshrd_n_s64(__s0, __p1); \
  62578   __ret; \
  62579 })
  /*
   * vshrn_high_n_u32(a, b, n): statement-expression macro yielding a
   * uint16x8_t.  The uint16x4_t first argument is passed as the first operand
   * of vcombine_u16 and vshrn_n_u32(b, n) (b is a uint32x4_t) as the second.
   * n is forwarded textually to vshrn_n_u32.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * combined result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62580 #ifdef __LITTLE_ENDIAN__
  62581 #define vshrn_high_n_u32(__p0_748, __p1_748, __p2_748) __extension__ ({ \
  62582   uint16x8_t __ret_748; \
  62583   uint16x4_t __s0_748 = __p0_748; \
  62584   uint32x4_t __s1_748 = __p1_748; \
  62585   __ret_748 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_748), (uint16x4_t)(vshrn_n_u32(__s1_748, __p2_748)))); \
  62586   __ret_748; \
  62587 })
  62588 #else
  62589 #define vshrn_high_n_u32(__p0_749, __p1_749, __p2_749) __extension__ ({ \
  62590   uint16x8_t __ret_749; \
  62591   uint16x4_t __s0_749 = __p0_749; \
  62592   uint32x4_t __s1_749 = __p1_749; \
  62593   uint16x4_t __rev0_749;  __rev0_749 = __builtin_shufflevector(__s0_749, __s0_749, 3, 2, 1, 0); \
  62594   uint32x4_t __rev1_749;  __rev1_749 = __builtin_shufflevector(__s1_749, __s1_749, 3, 2, 1, 0); \
  62595   __ret_749 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_749), (uint16x4_t)(__noswap_vshrn_n_u32(__rev1_749, __p2_749)))); \
  62596   __ret_749 = __builtin_shufflevector(__ret_749, __ret_749, 7, 6, 5, 4, 3, 2, 1, 0); \
  62597   __ret_749; \
  62598 })
  62599 #endif
  62600 
  /*
   * vshrn_high_n_u64(a, b, n): statement-expression macro yielding a
   * uint32x4_t.  The uint32x2_t first argument is passed as the first operand
   * of vcombine_u32 and vshrn_n_u64(b, n) (b is a uint64x2_t) as the second.
   * n is forwarded textually to vshrn_n_u64.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * combined result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62601 #ifdef __LITTLE_ENDIAN__
  62602 #define vshrn_high_n_u64(__p0_750, __p1_750, __p2_750) __extension__ ({ \
  62603   uint32x4_t __ret_750; \
  62604   uint32x2_t __s0_750 = __p0_750; \
  62605   uint64x2_t __s1_750 = __p1_750; \
  62606   __ret_750 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_750), (uint32x2_t)(vshrn_n_u64(__s1_750, __p2_750)))); \
  62607   __ret_750; \
  62608 })
  62609 #else
  62610 #define vshrn_high_n_u64(__p0_751, __p1_751, __p2_751) __extension__ ({ \
  62611   uint32x4_t __ret_751; \
  62612   uint32x2_t __s0_751 = __p0_751; \
  62613   uint64x2_t __s1_751 = __p1_751; \
  62614   uint32x2_t __rev0_751;  __rev0_751 = __builtin_shufflevector(__s0_751, __s0_751, 1, 0); \
  62615   uint64x2_t __rev1_751;  __rev1_751 = __builtin_shufflevector(__s1_751, __s1_751, 1, 0); \
  62616   __ret_751 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_751), (uint32x2_t)(__noswap_vshrn_n_u64(__rev1_751, __p2_751)))); \
  62617   __ret_751 = __builtin_shufflevector(__ret_751, __ret_751, 3, 2, 1, 0); \
  62618   __ret_751; \
  62619 })
  62620 #endif
  62621 
  /*
   * vshrn_high_n_u16(a, b, n): statement-expression macro yielding a
   * uint8x16_t.  The uint8x8_t first argument is passed as the first operand
   * of vcombine_u8 and vshrn_n_u16(b, n) (b is a uint16x8_t) as the second.
   * n is forwarded textually to vshrn_n_u16.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 16-lane result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62622 #ifdef __LITTLE_ENDIAN__
  62623 #define vshrn_high_n_u16(__p0_752, __p1_752, __p2_752) __extension__ ({ \
  62624   uint8x16_t __ret_752; \
  62625   uint8x8_t __s0_752 = __p0_752; \
  62626   uint16x8_t __s1_752 = __p1_752; \
  62627   __ret_752 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_752), (uint8x8_t)(vshrn_n_u16(__s1_752, __p2_752)))); \
  62628   __ret_752; \
  62629 })
  62630 #else
  62631 #define vshrn_high_n_u16(__p0_753, __p1_753, __p2_753) __extension__ ({ \
  62632   uint8x16_t __ret_753; \
  62633   uint8x8_t __s0_753 = __p0_753; \
  62634   uint16x8_t __s1_753 = __p1_753; \
  62635   uint8x8_t __rev0_753;  __rev0_753 = __builtin_shufflevector(__s0_753, __s0_753, 7, 6, 5, 4, 3, 2, 1, 0); \
  62636   uint16x8_t __rev1_753;  __rev1_753 = __builtin_shufflevector(__s1_753, __s1_753, 7, 6, 5, 4, 3, 2, 1, 0); \
  62637   __ret_753 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_753), (uint8x8_t)(__noswap_vshrn_n_u16(__rev1_753, __p2_753)))); \
  62638   __ret_753 = __builtin_shufflevector(__ret_753, __ret_753, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  62639   __ret_753; \
  62640 })
  62641 #endif
  62642 
  /*
   * vshrn_high_n_s32(a, b, n): statement-expression macro yielding an
   * int16x8_t.  The int16x4_t first argument is passed as the first operand
   * of vcombine_s16 and vshrn_n_s32(b, n) (b is an int32x4_t) as the second.
   * n is forwarded textually to vshrn_n_s32.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * combined result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62643 #ifdef __LITTLE_ENDIAN__
  62644 #define vshrn_high_n_s32(__p0_754, __p1_754, __p2_754) __extension__ ({ \
  62645   int16x8_t __ret_754; \
  62646   int16x4_t __s0_754 = __p0_754; \
  62647   int32x4_t __s1_754 = __p1_754; \
  62648   __ret_754 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_754), (int16x4_t)(vshrn_n_s32(__s1_754, __p2_754)))); \
  62649   __ret_754; \
  62650 })
  62651 #else
  62652 #define vshrn_high_n_s32(__p0_755, __p1_755, __p2_755) __extension__ ({ \
  62653   int16x8_t __ret_755; \
  62654   int16x4_t __s0_755 = __p0_755; \
  62655   int32x4_t __s1_755 = __p1_755; \
  62656   int16x4_t __rev0_755;  __rev0_755 = __builtin_shufflevector(__s0_755, __s0_755, 3, 2, 1, 0); \
  62657   int32x4_t __rev1_755;  __rev1_755 = __builtin_shufflevector(__s1_755, __s1_755, 3, 2, 1, 0); \
  62658   __ret_755 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_755), (int16x4_t)(__noswap_vshrn_n_s32(__rev1_755, __p2_755)))); \
  62659   __ret_755 = __builtin_shufflevector(__ret_755, __ret_755, 7, 6, 5, 4, 3, 2, 1, 0); \
  62660   __ret_755; \
  62661 })
  62662 #endif
  62663 
  /*
   * vshrn_high_n_s64(a, b, n): statement-expression macro yielding an
   * int32x4_t.  The int32x2_t first argument is passed as the first operand
   * of vcombine_s32 and vshrn_n_s64(b, n) (b is an int64x2_t) as the second.
   * n is forwarded textually to vshrn_n_s64.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * combined result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62664 #ifdef __LITTLE_ENDIAN__
  62665 #define vshrn_high_n_s64(__p0_756, __p1_756, __p2_756) __extension__ ({ \
  62666   int32x4_t __ret_756; \
  62667   int32x2_t __s0_756 = __p0_756; \
  62668   int64x2_t __s1_756 = __p1_756; \
  62669   __ret_756 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_756), (int32x2_t)(vshrn_n_s64(__s1_756, __p2_756)))); \
  62670   __ret_756; \
  62671 })
  62672 #else
  62673 #define vshrn_high_n_s64(__p0_757, __p1_757, __p2_757) __extension__ ({ \
  62674   int32x4_t __ret_757; \
  62675   int32x2_t __s0_757 = __p0_757; \
  62676   int64x2_t __s1_757 = __p1_757; \
  62677   int32x2_t __rev0_757;  __rev0_757 = __builtin_shufflevector(__s0_757, __s0_757, 1, 0); \
  62678   int64x2_t __rev1_757;  __rev1_757 = __builtin_shufflevector(__s1_757, __s1_757, 1, 0); \
  62679   __ret_757 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_757), (int32x2_t)(__noswap_vshrn_n_s64(__rev1_757, __p2_757)))); \
  62680   __ret_757 = __builtin_shufflevector(__ret_757, __ret_757, 3, 2, 1, 0); \
  62681   __ret_757; \
  62682 })
  62683 #endif
  62684 
  /*
   * vshrn_high_n_s16(a, b, n): statement-expression macro yielding an
   * int8x16_t.  The int8x8_t first argument is passed as the first operand
   * of vcombine_s8 and vshrn_n_s16(b, n) (b is an int16x8_t) as the second.
   * n is forwarded textually to vshrn_n_s16.
   *
   * Without __LITTLE_ENDIAN__, both vector arguments are lane-reversed with
   * __builtin_shufflevector, the __noswap_ helpers are called, and the
   * 16-lane result is lane-reversed again before being yielded.
   *
   * NOTE(review): the numeric suffix on the locals presumably prevents
   * clashes with locals of the nested macros -- confirm before renaming.
   */
  62685 #ifdef __LITTLE_ENDIAN__
  62686 #define vshrn_high_n_s16(__p0_758, __p1_758, __p2_758) __extension__ ({ \
  62687   int8x16_t __ret_758; \
  62688   int8x8_t __s0_758 = __p0_758; \
  62689   int16x8_t __s1_758 = __p1_758; \
  62690   __ret_758 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_758), (int8x8_t)(vshrn_n_s16(__s1_758, __p2_758)))); \
  62691   __ret_758; \
  62692 })
  62693 #else
  62694 #define vshrn_high_n_s16(__p0_759, __p1_759, __p2_759) __extension__ ({ \
  62695   int8x16_t __ret_759; \
  62696   int8x8_t __s0_759 = __p0_759; \
  62697   int16x8_t __s1_759 = __p1_759; \
  62698   int8x8_t __rev0_759;  __rev0_759 = __builtin_shufflevector(__s0_759, __s0_759, 7, 6, 5, 4, 3, 2, 1, 0); \
  62699   int16x8_t __rev1_759;  __rev1_759 = __builtin_shufflevector(__s1_759, __s1_759, 7, 6, 5, 4, 3, 2, 1, 0); \
  62700   __ret_759 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_759), (int8x8_t)(__noswap_vshrn_n_s16(__rev1_759, __p2_759)))); \
  62701   __ret_759 = __builtin_shufflevector(__ret_759, __ret_759, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  62702   __ret_759; \
  62703 })
  62704 #endif
  62705 
  /*
   * vslid_n_u64(__p0, __p1, __p2): statement-expression macro yielding a
   * uint64_t.  __p0 and __p1 are first copied into uint64_t locals, so each
   * is evaluated once, and the value is
   * __builtin_neon_vslid_n_u64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.
   */
  62706 #define vslid_n_u64(__p0, __p1, __p2) __extension__ ({ \
  62707   uint64_t __ret; \
  62708   uint64_t __s0 = __p0; \
  62709   uint64_t __s1 = __p1; \
  62710   __ret = (uint64_t) __builtin_neon_vslid_n_u64(__s0, __s1, __p2); \
  62711   __ret; \
  62712 })
  /*
   * vslid_n_s64(__p0, __p1, __p2): statement-expression macro yielding an
   * int64_t.  __p0 and __p1 are first copied into int64_t locals, so each is
   * evaluated once, and the value is
   * __builtin_neon_vslid_n_s64(__s0, __s1, __p2).  __p2 is substituted
   * textually into the builtin call.
   */
  62713 #define vslid_n_s64(__p0, __p1, __p2) __extension__ ({ \
  62714   int64_t __ret; \
  62715   int64_t __s0 = __p0; \
  62716   int64_t __s1 = __p1; \
  62717   __ret = (int64_t) __builtin_neon_vslid_n_s64(__s0, __s1, __p2); \
  62718   __ret; \
  62719 })
  /*
   * vsli_n_p64(__p0, __p1, __p2): statement-expression macro yielding a
   * poly64x1_t.  Both poly64x1_t operands are copied into locals,
   * reinterpreted as int8x8_t, and passed to __builtin_neon_vsli_n_v together
   * with __p2 and the constant 6.  There is no endian-specific variant.
   * NOTE(review): 6 is presumably the builtin's type code for poly64x1_t
   * -- confirm against the header generator.
   */
  62720 #define vsli_n_p64(__p0, __p1, __p2) __extension__ ({ \
  62721   poly64x1_t __ret; \
  62722   poly64x1_t __s0 = __p0; \
  62723   poly64x1_t __s1 = __p1; \
  62724   __ret = (poly64x1_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); \
  62725   __ret; \
  62726 })
  /*
   * vsliq_n_p64(__p0, __p1, __p2): statement-expression macro yielding a
   * poly64x2_t.  Both poly64x2_t operands are copied into locals,
   * reinterpreted as int8x16_t, and passed to __builtin_neon_vsliq_n_v
   * together with __p2 and the constant 38.
   *
   * Without __LITTLE_ENDIAN__, the two lanes of each operand are swapped
   * before the builtin call and the two lanes of the result are swapped
   * after it.
   *
   * NOTE(review): 38 is presumably the builtin's type code for poly64x2_t
   * -- confirm against the header generator.
   */
  62727 #ifdef __LITTLE_ENDIAN__
  62728 #define vsliq_n_p64(__p0, __p1, __p2) __extension__ ({ \
  62729   poly64x2_t __ret; \
  62730   poly64x2_t __s0 = __p0; \
  62731   poly64x2_t __s1 = __p1; \
  62732   __ret = (poly64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); \
  62733   __ret; \
  62734 })
  62735 #else
  62736 #define vsliq_n_p64(__p0, __p1, __p2) __extension__ ({ \
  62737   poly64x2_t __ret; \
  62738   poly64x2_t __s0 = __p0; \
  62739   poly64x2_t __s1 = __p1; \
  62740   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  62741   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  62742   __ret = (poly64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); \
  62743   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  62744   __ret; \
  62745 })
  62746 #endif
  62747 
  /*
   * vsqaddb_u8: returns __builtin_neon_vsqaddb_u8(__p0, __p1) as a uint8_t.
   * Note that __p1 is a signed int8_t while __p0 and the result are unsigned.
   */
  62748 __ai __attribute__((target("neon"))) uint8_t vsqaddb_u8(uint8_t __p0, int8_t __p1) {
  62749   uint8_t __ret;
  62750   __ret = (uint8_t) __builtin_neon_vsqaddb_u8(__p0, __p1);
  62751   return __ret;
  62752 }
  /*
   * vsqadds_u32: returns __builtin_neon_vsqadds_u32(__p0, __p1) as a uint32_t.
   * Note that __p1 is a signed int32_t while __p0 and the result are unsigned.
   */
  62753 __ai __attribute__((target("neon"))) uint32_t vsqadds_u32(uint32_t __p0, int32_t __p1) {
  62754   uint32_t __ret;
  62755   __ret = (uint32_t) __builtin_neon_vsqadds_u32(__p0, __p1);
  62756   return __ret;
  62757 }
  /*
   * vsqaddd_u64: returns __builtin_neon_vsqaddd_u64(__p0, __p1) as a uint64_t.
   * Note that __p1 is a signed int64_t while __p0 and the result are unsigned.
   */
  62758 __ai __attribute__((target("neon"))) uint64_t vsqaddd_u64(uint64_t __p0, int64_t __p1) {
  62759   uint64_t __ret;
  62760   __ret = (uint64_t) __builtin_neon_vsqaddd_u64(__p0, __p1);
  62761   return __ret;
  62762 }
  /*
   * vsqaddh_u16: returns __builtin_neon_vsqaddh_u16(__p0, __p1) as a uint16_t.
   * Note that __p1 is a signed int16_t while __p0 and the result are unsigned.
   */
  62763 __ai __attribute__((target("neon"))) uint16_t vsqaddh_u16(uint16_t __p0, int16_t __p1) {
  62764   uint16_t __ret;
  62765   __ret = (uint16_t) __builtin_neon_vsqaddh_u16(__p0, __p1);
  62766   return __ret;
  62767 }
  /*
   * vsqaddq_u8: passes the uint8x16_t __p0 and the int8x16_t __p1, both cast
   * to int8x16_t, to __builtin_neon_vsqaddq_v together with the constant 48
   * and returns the result as uint8x16_t.
   *
   * Without __LITTLE_ENDIAN__, the 16 lanes of each input are reversed before
   * the builtin call and the 16 lanes of the result are reversed after it.
   *
   * NOTE(review): 48 is presumably the builtin's type code for uint8x16_t
   * -- confirm against the header generator.
   */
  62768 #ifdef __LITTLE_ENDIAN__
  62769 __ai __attribute__((target("neon"))) uint8x16_t vsqaddq_u8(uint8x16_t __p0, int8x16_t __p1) {
  62770   uint8x16_t __ret;
  62771   __ret = (uint8x16_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48);
  62772   return __ret;
  62773 }
  62774 #else
  62775 __ai __attribute__((target("neon"))) uint8x16_t vsqaddq_u8(uint8x16_t __p0, int8x16_t __p1) {
  62776   uint8x16_t __ret;
  62777   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  62778   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  62779   __ret = (uint8x16_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48);
  62780   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  62781   return __ret;
  62782 }
  62783 #endif
  62784 
  /*
   * vsqaddq_u32: passes the uint32x4_t __p0 and the int32x4_t __p1, both
   * reinterpreted as int8x16_t, to __builtin_neon_vsqaddq_v together with the
   * constant 50 and returns the result as uint32x4_t.
   *
   * Without __LITTLE_ENDIAN__, the 4 lanes of each input are reversed before
   * the builtin call and the 4 lanes of the result are reversed after it.
   *
   * NOTE(review): 50 is presumably the builtin's type code for uint32x4_t
   * -- confirm against the header generator.
   */
  62785 #ifdef __LITTLE_ENDIAN__
  62786 __ai __attribute__((target("neon"))) uint32x4_t vsqaddq_u32(uint32x4_t __p0, int32x4_t __p1) {
  62787   uint32x4_t __ret;
  62788   __ret = (uint32x4_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50);
  62789   return __ret;
  62790 }
  62791 #else
  62792 __ai __attribute__((target("neon"))) uint32x4_t vsqaddq_u32(uint32x4_t __p0, int32x4_t __p1) {
  62793   uint32x4_t __ret;
  62794   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  62795   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  62796   __ret = (uint32x4_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  62797   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  62798   return __ret;
  62799 }
  62800 #endif
  62801 
  /*
   * vsqaddq_u64: passes the uint64x2_t __p0 and the int64x2_t __p1, both
   * reinterpreted as int8x16_t, to __builtin_neon_vsqaddq_v together with the
   * constant 51 and returns the result as uint64x2_t.
   *
   * Without __LITTLE_ENDIAN__, the 2 lanes of each input are swapped before
   * the builtin call and the 2 lanes of the result are swapped after it.
   *
   * NOTE(review): 51 is presumably the builtin's type code for uint64x2_t
   * -- confirm against the header generator.
   */
  62802 #ifdef __LITTLE_ENDIAN__
  62803 __ai __attribute__((target("neon"))) uint64x2_t vsqaddq_u64(uint64x2_t __p0, int64x2_t __p1) {
  62804   uint64x2_t __ret;
  62805   __ret = (uint64x2_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  62806   return __ret;
  62807 }
  62808 #else
  62809 __ai __attribute__((target("neon"))) uint64x2_t vsqaddq_u64(uint64x2_t __p0, int64x2_t __p1) {
  62810   uint64x2_t __ret;
  62811   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62812   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  62813   __ret = (uint64x2_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  62814   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62815   return __ret;
  62816 }
  62817 #endif
  62818 
  62819 #ifdef __LITTLE_ENDIAN__
  62820 __ai __attribute__((target("neon"))) uint16x8_t vsqaddq_u16(uint16x8_t __p0, int16x8_t __p1) {
  62821   uint16x8_t __ret;
  62822   __ret = (uint16x8_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49);
  62823   return __ret;
  62824 }
  62825 #else
  62826 __ai __attribute__((target("neon"))) uint16x8_t vsqaddq_u16(uint16x8_t __p0, int16x8_t __p1) {
  62827   uint16x8_t __ret;
  62828   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  62829   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  62830   __ret = (uint16x8_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49);
  62831   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  62832   return __ret;
  62833 }
  62834 #endif
  62835 
  62836 #ifdef __LITTLE_ENDIAN__
  62837 __ai __attribute__((target("neon"))) uint8x8_t vsqadd_u8(uint8x8_t __p0, int8x8_t __p1) {
  62838   uint8x8_t __ret;
  62839   __ret = (uint8x8_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16);
  62840   return __ret;
  62841 }
  62842 #else
  62843 __ai __attribute__((target("neon"))) uint8x8_t vsqadd_u8(uint8x8_t __p0, int8x8_t __p1) {
  62844   uint8x8_t __ret;
  62845   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  62846   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  62847   __ret = (uint8x8_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16);
  62848   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  62849   return __ret;
  62850 }
  62851 #endif
  62852 
  62853 #ifdef __LITTLE_ENDIAN__
  62854 __ai __attribute__((target("neon"))) uint32x2_t vsqadd_u32(uint32x2_t __p0, int32x2_t __p1) {
  62855   uint32x2_t __ret;
  62856   __ret = (uint32x2_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18);
  62857   return __ret;
  62858 }
  62859 #else
  62860 __ai __attribute__((target("neon"))) uint32x2_t vsqadd_u32(uint32x2_t __p0, int32x2_t __p1) {
  62861   uint32x2_t __ret;
  62862   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62863   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  62864   __ret = (uint32x2_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18);
  62865   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62866   return __ret;
  62867 }
  62868 #endif
  62869 
  62870 __ai __attribute__((target("neon"))) uint64x1_t vsqadd_u64(uint64x1_t __p0, int64x1_t __p1) {
  62871   uint64x1_t __ret;
  62872   __ret = (uint64x1_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  62873   return __ret;
  62874 }
  62875 #ifdef __LITTLE_ENDIAN__
  62876 __ai __attribute__((target("neon"))) uint16x4_t vsqadd_u16(uint16x4_t __p0, int16x4_t __p1) {
  62877   uint16x4_t __ret;
  62878   __ret = (uint16x4_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17);
  62879   return __ret;
  62880 }
  62881 #else
  62882 __ai __attribute__((target("neon"))) uint16x4_t vsqadd_u16(uint16x4_t __p0, int16x4_t __p1) {
  62883   uint16x4_t __ret;
  62884   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  62885   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  62886   __ret = (uint16x4_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17);
  62887   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  62888   return __ret;
  62889 }
  62890 #endif
  62891 
  62892 #ifdef __LITTLE_ENDIAN__
  62893 __ai __attribute__((target("neon"))) float64x2_t vsqrtq_f64(float64x2_t __p0) {
  62894   float64x2_t __ret;
  62895   __ret = (float64x2_t) __builtin_neon_vsqrtq_v((int8x16_t)__p0, 42);
  62896   return __ret;
  62897 }
  62898 #else
  62899 __ai __attribute__((target("neon"))) float64x2_t vsqrtq_f64(float64x2_t __p0) {
  62900   float64x2_t __ret;
  62901   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62902   __ret = (float64x2_t) __builtin_neon_vsqrtq_v((int8x16_t)__rev0, 42);
  62903   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62904   return __ret;
  62905 }
  62906 #endif
  62907 
  62908 #ifdef __LITTLE_ENDIAN__
  62909 __ai __attribute__((target("neon"))) float32x4_t vsqrtq_f32(float32x4_t __p0) {
  62910   float32x4_t __ret;
  62911   __ret = (float32x4_t) __builtin_neon_vsqrtq_v((int8x16_t)__p0, 41);
  62912   return __ret;
  62913 }
  62914 #else
  62915 __ai __attribute__((target("neon"))) float32x4_t vsqrtq_f32(float32x4_t __p0) {
  62916   float32x4_t __ret;
  62917   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  62918   __ret = (float32x4_t) __builtin_neon_vsqrtq_v((int8x16_t)__rev0, 41);
  62919   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  62920   return __ret;
  62921 }
  62922 #endif
  62923 
  62924 __ai __attribute__((target("neon"))) float64x1_t vsqrt_f64(float64x1_t __p0) {
  62925   float64x1_t __ret;
  62926   __ret = (float64x1_t) __builtin_neon_vsqrt_v((int8x8_t)__p0, 10);
  62927   return __ret;
  62928 }
  62929 #ifdef __LITTLE_ENDIAN__
  62930 __ai __attribute__((target("neon"))) float32x2_t vsqrt_f32(float32x2_t __p0) {
  62931   float32x2_t __ret;
  62932   __ret = (float32x2_t) __builtin_neon_vsqrt_v((int8x8_t)__p0, 9);
  62933   return __ret;
  62934 }
  62935 #else
  62936 __ai __attribute__((target("neon"))) float32x2_t vsqrt_f32(float32x2_t __p0) {
  62937   float32x2_t __ret;
  62938   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  62939   __ret = (float32x2_t) __builtin_neon_vsqrt_v((int8x8_t)__rev0, 9);
  62940   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  62941   return __ret;
  62942 }
  62943 #endif
  62944 
  /* vsrad_n_u64: copies the first two arguments into uint64_t temporaries
   * (each evaluated once) and yields
   * __builtin_neon_vsrad_n_u64(__s0, __s1, __p2) as a uint64_t. */
  #define vsrad_n_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64_t __s0 = __p0; \
    uint64_t __s1 = __p1; \
    (uint64_t) __builtin_neon_vsrad_n_u64(__s0, __s1, __p2); \
  })
  /* vsrad_n_s64: copies the first two arguments into int64_t temporaries
   * (each evaluated once) and yields
   * __builtin_neon_vsrad_n_s64(__s0, __s1, __p2) as an int64_t. */
  #define vsrad_n_s64(__p0, __p1, __p2) __extension__ ({ \
    int64_t __s0 = __p0; \
    int64_t __s1 = __p1; \
    (int64_t) __builtin_neon_vsrad_n_s64(__s0, __s1, __p2); \
  })
  /* vsrid_n_u64: copies the first two arguments into uint64_t temporaries
   * (each evaluated once) and yields
   * __builtin_neon_vsrid_n_u64(__s0, __s1, __p2) as a uint64_t. */
  #define vsrid_n_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64_t __s0 = __p0; \
    uint64_t __s1 = __p1; \
    (uint64_t) __builtin_neon_vsrid_n_u64(__s0, __s1, __p2); \
  })
  /* vsrid_n_s64: copies the first two arguments into int64_t temporaries
   * (each evaluated once) and yields
   * __builtin_neon_vsrid_n_s64(__s0, __s1, __p2) as an int64_t. */
  #define vsrid_n_s64(__p0, __p1, __p2) __extension__ ({ \
    int64_t __s0 = __p0; \
    int64_t __s1 = __p1; \
    (int64_t) __builtin_neon_vsrid_n_s64(__s0, __s1, __p2); \
  })
  /* vsri_n_p64: copies both vector arguments into poly64x1_t temporaries and
   * yields __builtin_neon_vsri_n_v on their int8x8_t reinterpretations with
   * immediate __p2 and type code 6, cast back to poly64x1_t. */
  #define vsri_n_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x1_t __s0 = __p0; \
    poly64x1_t __s1 = __p1; \
    (poly64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); \
  })
  /* vsriq_n_p64: copies both vector arguments into poly64x2_t temporaries and
   * yields __builtin_neon_vsriq_n_v on their int8x16_t reinterpretations with
   * immediate __p2 and type code 38. Without __LITTLE_ENDIAN__ the two lanes
   * are swapped on the inputs before the call and on the result after it. */
  #ifdef __LITTLE_ENDIAN__
  #define vsriq_n_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2_t __s0 = __p0; \
    poly64x2_t __s1 = __p1; \
    (poly64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); \
  })
  #else
  #define vsriq_n_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2_t __s0 = __p0; \
    poly64x2_t __s1 = __p1; \
    poly64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
    poly64x2_t __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
    poly64x2_t __ret = (poly64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); \
    __builtin_shufflevector(__ret, __ret, 1, 0); \
  })
  #endif
  63000 
  /* vst1_p64: copies __p1 into a poly64x1_t, reinterprets it as int8x8_t and
   * passes it with __p0 to __builtin_neon_vst1_v (type code 6). */
  #define vst1_p64(__p0, __p1) __extension__ ({ \
    poly64x1_t __s1 = __p1; \
    int8x8_t __raw = (int8x8_t)__s1; \
    __builtin_neon_vst1_v(__p0, __raw, 6); \
  })
  /* vst1q_p64: copies __p1 into a poly64x2_t, reinterprets it as int8x16_t
   * and passes it with __p0 to __builtin_neon_vst1q_v (type code 38).
   * Without __LITTLE_ENDIAN__ the two lanes are swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_p64(__p0, __p1) __extension__ ({ \
    poly64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__s1; \
    __builtin_neon_vst1q_v(__p0, __raw, 38); \
  })
  #else
  #define vst1q_p64(__p0, __p1) __extension__ ({ \
    poly64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__builtin_shufflevector(__s1, __s1, 1, 0); \
    __builtin_neon_vst1q_v(__p0, __raw, 38); \
  })
  #endif
  63017 
  /* vst1q_f64: copies __p1 into a float64x2_t, reinterprets it as int8x16_t
   * and passes it with __p0 to __builtin_neon_vst1q_v (type code 42).
   * Without __LITTLE_ENDIAN__ the two lanes are swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_f64(__p0, __p1) __extension__ ({ \
    float64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__s1; \
    __builtin_neon_vst1q_v(__p0, __raw, 42); \
  })
  #else
  #define vst1q_f64(__p0, __p1) __extension__ ({ \
    float64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__builtin_shufflevector(__s1, __s1, 1, 0); \
    __builtin_neon_vst1q_v(__p0, __raw, 42); \
  })
  #endif
  63030 
  /* vst1_f64: copies __p1 into a float64x1_t, reinterprets it as int8x8_t and
   * passes it with __p0 to __builtin_neon_vst1_v (type code 10). */
  #define vst1_f64(__p0, __p1) __extension__ ({ \
    float64x1_t __s1 = __p1; \
    int8x8_t __raw = (int8x8_t)__s1; \
    __builtin_neon_vst1_v(__p0, __raw, 10); \
  })
  /* vst1_lane_p64: copies __p1 into a poly64x1_t, reinterprets it as int8x8_t
   * and passes it with __p0 and lane index __p2 to
   * __builtin_neon_vst1_lane_v (type code 6). */
  #define vst1_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x1_t __s1 = __p1; \
    int8x8_t __raw = (int8x8_t)__s1; \
    __builtin_neon_vst1_lane_v(__p0, __raw, __p2, 6); \
  })
  /* vst1q_lane_p64: copies __p1 into a poly64x2_t, reinterprets it as
   * int8x16_t and passes it with __p0 and lane index __p2 to
   * __builtin_neon_vst1q_lane_v (type code 38). Without __LITTLE_ENDIAN__ the
   * two lanes are swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__s1; \
    __builtin_neon_vst1q_lane_v(__p0, __raw, __p2, 38); \
  })
  #else
  #define vst1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__builtin_shufflevector(__s1, __s1, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, __raw, __p2, 38); \
  })
  #endif
  63051 
  /* vst1q_lane_f64: copies __p1 into a float64x2_t, reinterprets it as
   * int8x16_t and passes it with __p0 and lane index __p2 to
   * __builtin_neon_vst1q_lane_v (type code 42). Without __LITTLE_ENDIAN__ the
   * two lanes are swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__s1; \
    __builtin_neon_vst1q_lane_v(__p0, __raw, __p2, 42); \
  })
  #else
  #define vst1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2_t __s1 = __p1; \
    int8x16_t __raw = (int8x16_t)__builtin_shufflevector(__s1, __s1, 1, 0); \
    __builtin_neon_vst1q_lane_v(__p0, __raw, __p2, 42); \
  })
  #endif
  63064 
  /* vst1_lane_f64: copies __p1 into a float64x1_t, reinterprets it as
   * int8x8_t and passes it with __p0 and lane index __p2 to
   * __builtin_neon_vst1_lane_v (type code 10). */
  #define vst1_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x1_t __s1 = __p1; \
    int8x8_t __raw = (int8x8_t)__s1; \
    __builtin_neon_vst1_lane_v(__p0, __raw, __p2, 10); \
  })
  /* vst1_p64_x2: copies __p1 into a poly64x1x2_t and passes its two vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst1_x2_v
   * (type code 6). */
  #define vst1_p64_x2(__p0, __p1) __extension__ ({ \
    poly64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst1_x2_v(__p0, __raw0, __raw1, 6); \
  })
  /* vst1q_p64_x2: copies __p1 into a poly64x2x2_t and passes its two vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst1q_x2_v
   * (type code 38). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_p64_x2(__p0, __p1) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst1q_x2_v(__p0, __raw0, __raw1, 38); \
  })
  #else
  #define vst1q_p64_x2(__p0, __p1) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1q_x2_v(__p0, __raw0, __raw1, 38); \
  })
  #endif
  63087 
  /* vst1q_f64_x2: copies __p1 into a float64x2x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 to
   * __builtin_neon_vst1q_x2_v (type code 42). Without __LITTLE_ENDIAN__ each
   * vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_f64_x2(__p0, __p1) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst1q_x2_v(__p0, __raw0, __raw1, 42); \
  })
  #else
  #define vst1q_f64_x2(__p0, __p1) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst1q_x2_v(__p0, __raw0, __raw1, 42); \
  })
  #endif
  63102 
  /* vst1_f64_x2: copies __p1 into a float64x1x2_t and passes its two vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst1_x2_v
   * (type code 10). */
  #define vst1_f64_x2(__p0, __p1) __extension__ ({ \
    float64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst1_x2_v(__p0, __raw0, __raw1, 10); \
  })
  /* vst1_p64_x3: copies __p1 into a poly64x1x3_t and passes its three
   * vectors, reinterpreted as int8x8_t, with __p0 to
   * __builtin_neon_vst1_x3_v (type code 6). */
  #define vst1_p64_x3(__p0, __p1) __extension__ ({ \
    poly64x1x3_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    __builtin_neon_vst1_x3_v(__p0, __raw0, __raw1, __raw2, 6); \
  })
  /* vst1q_p64_x3: copies __p1 into a poly64x2x3_t and passes its three
   * vectors, reinterpreted as int8x16_t, with __p0 to
   * __builtin_neon_vst1q_x3_v (type code 38). Without __LITTLE_ENDIAN__ each
   * vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_p64_x3(__p0, __p1) __extension__ ({ \
    poly64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst1q_x3_v(__p0, __raw0, __raw1, __raw2, 38); \
  })
  #else
  #define vst1q_p64_x3(__p0, __p1) __extension__ ({ \
    poly64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1q_x3_v(__p0, __raw0, __raw1, __raw2, 38); \
  })
  #endif
  63126 
  /* vst1q_f64_x3: copies __p1 into a float64x2x3_t and passes its three
   * vectors, reinterpreted as int8x16_t, with __p0 to
   * __builtin_neon_vst1q_x3_v (type code 42). Without __LITTLE_ENDIAN__ each
   * vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_f64_x3(__p0, __p1) __extension__ ({ \
    float64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst1q_x3_v(__p0, __raw0, __raw1, __raw2, 42); \
  })
  #else
  #define vst1q_f64_x3(__p0, __p1) __extension__ ({ \
    float64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst1q_x3_v(__p0, __raw0, __raw1, __raw2, 42); \
  })
  #endif
  63142 
  /* vst1_f64_x3: copies __p1 into a float64x1x3_t and passes its three
   * vectors, reinterpreted as int8x8_t, with __p0 to
   * __builtin_neon_vst1_x3_v (type code 10). */
  #define vst1_f64_x3(__p0, __p1) __extension__ ({ \
    float64x1x3_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    __builtin_neon_vst1_x3_v(__p0, __raw0, __raw1, __raw2, 10); \
  })
  /* vst1_p64_x4: copies __p1 into a poly64x1x4_t and passes its four vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst1_x4_v
   * (type code 6). */
  #define vst1_p64_x4(__p0, __p1) __extension__ ({ \
    poly64x1x4_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    int8x8_t __raw3 = (int8x8_t)__s1.val[3]; \
    __builtin_neon_vst1_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 6); \
  })
  /* vst1q_p64_x4: copies __p1 into a poly64x2x4_t and passes its four
   * vectors, reinterpreted as int8x16_t, with __p0 to
   * __builtin_neon_vst1q_x4_v (type code 38). Without __LITTLE_ENDIAN__ each
   * vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_p64_x4(__p0, __p1) __extension__ ({ \
    poly64x2x4_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    int8x16_t __raw3 = (int8x16_t)__s1.val[3]; \
    __builtin_neon_vst1q_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 38); \
  })
  #else
  #define vst1q_p64_x4(__p0, __p1) __extension__ ({ \
    poly64x2x4_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    int8x16_t __raw3 = (int8x16_t)__builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
    __builtin_neon_vst1q_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 38); \
  })
  #endif
  63167 
  /* vst1q_f64_x4: copies __p1 into a float64x2x4_t and passes its four
   * vectors, reinterpreted as int8x16_t, with __p0 to
   * __builtin_neon_vst1q_x4_v (type code 42). Without __LITTLE_ENDIAN__ each
   * vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst1q_f64_x4(__p0, __p1) __extension__ ({ \
    float64x2x4_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    int8x16_t __raw3 = (int8x16_t)__s1.val[3]; \
    __builtin_neon_vst1q_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 42); \
  })
  #else
  #define vst1q_f64_x4(__p0, __p1) __extension__ ({ \
    float64x2x4_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    int8x16_t __raw3 = (int8x16_t)__builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
    __builtin_neon_vst1q_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 42); \
  })
  #endif
  63184 
  /* vst1_f64_x4: copies __p1 into a float64x1x4_t and passes its four
   * vectors, reinterpreted as int8x8_t, with __p0 to
   * __builtin_neon_vst1_x4_v (type code 10). */
  #define vst1_f64_x4(__p0, __p1) __extension__ ({ \
    float64x1x4_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    int8x8_t __raw3 = (int8x8_t)__s1.val[3]; \
    __builtin_neon_vst1_x4_v(__p0, __raw0, __raw1, __raw2, __raw3, 10); \
  })
  /* vst2_p64: copies __p1 into a poly64x1x2_t and passes its two vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst2_v
   * (type code 6). */
  #define vst2_p64(__p0, __p1) __extension__ ({ \
    poly64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_v(__p0, __raw0, __raw1, 6); \
  })
  /* vst2q_p64: copies __p1 into a poly64x2x2_t and passes its two vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst2q_v
   * (type code 38). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_p64(__p0, __p1) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 38); \
  })
  #else
  #define vst2q_p64(__p0, __p1) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 38); \
  })
  #endif
  63207 
  /* vst2q_u64: copies __p1 into a uint64x2x2_t and passes its two vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst2q_v
   * (type code 51). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_u64(__p0, __p1) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 51); \
  })
  #else
  #define vst2q_u64(__p0, __p1) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 51); \
  })
  #endif
  63222 
  /* vst2q_f64: copies __p1 into a float64x2x2_t and passes its two vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst2q_v
   * (type code 42). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_f64(__p0, __p1) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 42); \
  })
  #else
  #define vst2q_f64(__p0, __p1) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 42); \
  })
  #endif
  63237 
  /* vst2q_s64: copies __p1 into an int64x2x2_t and passes its two vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst2q_v
   * (type code 35). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_s64(__p0, __p1) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 35); \
  })
  #else
  #define vst2q_s64(__p0, __p1) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_v(__p0, __raw0, __raw1, 35); \
  })
  #endif
  63252 
  /* vst2_f64: copies __p1 into a float64x1x2_t and passes its two vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst2_v
   * (type code 10). */
  #define vst2_f64(__p0, __p1) __extension__ ({ \
    float64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_v(__p0, __raw0, __raw1, 10); \
  })
  /* vst2_lane_p64: copies __p1 into a poly64x1x2_t and passes its two
   * vectors, reinterpreted as int8x8_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2_lane_v (type code 6). */
  #define vst2_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_lane_v(__p0, __raw0, __raw1, __p2, 6); \
  })
  /* vst2q_lane_p8: copies __p1 into a poly8x16x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 36). Without __LITTLE_ENDIAN__
   * each vector has its sixteen lanes reversed first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 36); \
  })
  #else
  #define vst2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 36); \
  })
  #endif
  63275 
  /* vst2q_lane_p64: copies __p1 into a poly64x2x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 38). Without __LITTLE_ENDIAN__
   * each vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 38); \
  })
  #else
  #define vst2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 38); \
  })
  #endif
  63290 
  /* vst2q_lane_u8: copies __p1 into a uint8x16x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 48). Without __LITTLE_ENDIAN__
   * each vector has its sixteen lanes reversed first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 48); \
  })
  #else
  #define vst2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
    uint8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 48); \
  })
  #endif
  63305 
  /* vst2q_lane_u64: copies __p1 into a uint64x2x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 51). Without __LITTLE_ENDIAN__
   * each vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 51); \
  })
  #else
  #define vst2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 51); \
  })
  #endif
  63320 
  /* vst2q_lane_s8: copies __p1 into an int8x16x2_t and passes its two
   * vectors, cast to int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 32). Without __LITTLE_ENDIAN__
   * each vector has its sixteen lanes reversed first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 32); \
  })
  #else
  #define vst2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
    int8x16x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 32); \
  })
  #endif
  63335 
  /* vst2q_lane_f64: copies __p1 into a float64x2x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 42). Without __LITTLE_ENDIAN__
   * each vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 42); \
  })
  #else
  #define vst2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 42); \
  })
  #endif
  63350 
  /* vst2q_lane_s64: copies __p1 into an int64x2x2_t and passes its two
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2q_lane_v (type code 35). Without __LITTLE_ENDIAN__
   * each vector has its two lanes swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 35); \
  })
  #else
  #define vst2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x2x2_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    __builtin_neon_vst2q_lane_v(__p0, __raw0, __raw1, __p2, 35); \
  })
  #endif
  63365 
  /* vst2_lane_u64: copies __p1 into a uint64x1x2_t and passes its two
   * vectors, reinterpreted as int8x8_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2_lane_v (type code 19). */
  #define vst2_lane_u64(__p0, __p1, __p2) __extension__ ({ \
    uint64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_lane_v(__p0, __raw0, __raw1, __p2, 19); \
  })
  /* vst2_lane_f64: copies __p1 into a float64x1x2_t and passes its two
   * vectors, reinterpreted as int8x8_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2_lane_v (type code 10). */
  #define vst2_lane_f64(__p0, __p1, __p2) __extension__ ({ \
    float64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_lane_v(__p0, __raw0, __raw1, __p2, 10); \
  })
  /* vst2_lane_s64: copies __p1 into an int64x1x2_t and passes its two
   * vectors, reinterpreted as int8x8_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst2_lane_v (type code 3). */
  #define vst2_lane_s64(__p0, __p1, __p2) __extension__ ({ \
    int64x1x2_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    __builtin_neon_vst2_lane_v(__p0, __raw0, __raw1, __p2, 3); \
  })
  /* vst3_p64: copies __p1 into a poly64x1x3_t and passes its three vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst3_v
   * (type code 6). */
  #define vst3_p64(__p0, __p1) __extension__ ({ \
    poly64x1x3_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    __builtin_neon_vst3_v(__p0, __raw0, __raw1, __raw2, 6); \
  })
  /* vst3q_p64: copies __p1 into a poly64x2x3_t and passes its three vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst3q_v
   * (type code 38). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst3q_p64(__p0, __p1) __extension__ ({ \
    poly64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 38); \
  })
  #else
  #define vst3q_p64(__p0, __p1) __extension__ ({ \
    poly64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 38); \
  })
  #endif
  63397 
  /* vst3q_u64: copies __p1 into a uint64x2x3_t and passes its three vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst3q_v
   * (type code 51). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst3q_u64(__p0, __p1) __extension__ ({ \
    uint64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 51); \
  })
  #else
  #define vst3q_u64(__p0, __p1) __extension__ ({ \
    uint64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 51); \
  })
  #endif
  63413 
  /* vst3q_f64: copies __p1 into a float64x2x3_t and passes its three vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst3q_v
   * (type code 42). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst3q_f64(__p0, __p1) __extension__ ({ \
    float64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 42); \
  })
  #else
  #define vst3q_f64(__p0, __p1) __extension__ ({ \
    float64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 42); \
  })
  #endif
  63429 
  /* vst3q_s64: copies __p1 into an int64x2x3_t and passes its three vectors,
   * reinterpreted as int8x16_t, with __p0 to __builtin_neon_vst3q_v
   * (type code 35). Without __LITTLE_ENDIAN__ each vector has its two lanes
   * swapped first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst3q_s64(__p0, __p1) __extension__ ({ \
    int64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 35); \
  })
  #else
  #define vst3q_s64(__p0, __p1) __extension__ ({ \
    int64x2x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
    __builtin_neon_vst3q_v(__p0, __raw0, __raw1, __raw2, 35); \
  })
  #endif
  63445 
  /* vst3_f64: copies __p1 into a float64x1x3_t and passes its three vectors,
   * reinterpreted as int8x8_t, with __p0 to __builtin_neon_vst3_v
   * (type code 10). */
  #define vst3_f64(__p0, __p1) __extension__ ({ \
    float64x1x3_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    __builtin_neon_vst3_v(__p0, __raw0, __raw1, __raw2, 10); \
  })
  /* vst3_lane_p64: copies __p1 into a poly64x1x3_t and passes its three
   * vectors, reinterpreted as int8x8_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst3_lane_v (type code 6). */
  #define vst3_lane_p64(__p0, __p1, __p2) __extension__ ({ \
    poly64x1x3_t __s1 = __p1; \
    int8x8_t __raw0 = (int8x8_t)__s1.val[0]; \
    int8x8_t __raw1 = (int8x8_t)__s1.val[1]; \
    int8x8_t __raw2 = (int8x8_t)__s1.val[2]; \
    __builtin_neon_vst3_lane_v(__p0, __raw0, __raw1, __raw2, __p2, 6); \
  })
  /* vst3q_lane_p8: copies __p1 into a poly8x16x3_t and passes its three
   * vectors, reinterpreted as int8x16_t, with __p0 and lane index __p2 to
   * __builtin_neon_vst3q_lane_v (type code 36). Without __LITTLE_ENDIAN__
   * each vector has its sixteen lanes reversed first. */
  #ifdef __LITTLE_ENDIAN__
  #define vst3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__s1.val[0]; \
    int8x16_t __raw1 = (int8x16_t)__s1.val[1]; \
    int8x16_t __raw2 = (int8x16_t)__s1.val[2]; \
    __builtin_neon_vst3q_lane_v(__p0, __raw0, __raw1, __raw2, __p2, 36); \
  })
  #else
  #define vst3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
    poly8x16x3_t __s1 = __p1; \
    int8x16_t __raw0 = (int8x16_t)__builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __raw1 = (int8x16_t)__builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    int8x16_t __raw2 = (int8x16_t)__builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
    __builtin_neon_vst3q_lane_v(__p0, __raw0, __raw1, __raw2, __p2, 36); \
  })
  #endif
  63469 
  63470 #ifdef __LITTLE_ENDIAN__
  63471 #define vst3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  63472   poly64x2x3_t __s1 = __p1; \
  63473   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 38); \
  63474 })
  63475 #else
  63476 #define vst3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  63477   poly64x2x3_t __s1 = __p1; \
  63478   poly64x2x3_t __rev1; \
  63479   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63480   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63481   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63482   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 38); \
  63483 })
  63484 #endif
  63485 
  63486 #ifdef __LITTLE_ENDIAN__
  63487 #define vst3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  63488   uint8x16x3_t __s1 = __p1; \
  63489   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 48); \
  63490 })
  63491 #else
  63492 #define vst3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  63493   uint8x16x3_t __s1 = __p1; \
  63494   uint8x16x3_t __rev1; \
  63495   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63496   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63497   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63498   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 48); \
  63499 })
  63500 #endif
  63501 
  63502 #ifdef __LITTLE_ENDIAN__
  63503 #define vst3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63504   uint64x2x3_t __s1 = __p1; \
  63505   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 51); \
  63506 })
  63507 #else
  63508 #define vst3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63509   uint64x2x3_t __s1 = __p1; \
  63510   uint64x2x3_t __rev1; \
  63511   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63512   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63513   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63514   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 51); \
  63515 })
  63516 #endif
  63517 
  63518 #ifdef __LITTLE_ENDIAN__
  63519 #define vst3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  63520   int8x16x3_t __s1 = __p1; \
  63521   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 32); \
  63522 })
  63523 #else
  63524 #define vst3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  63525   int8x16x3_t __s1 = __p1; \
  63526   int8x16x3_t __rev1; \
  63527   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63528   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63529   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63530   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 32); \
  63531 })
  63532 #endif
  63533 
  63534 #ifdef __LITTLE_ENDIAN__
  63535 #define vst3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63536   float64x2x3_t __s1 = __p1; \
  63537   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 42); \
  63538 })
  63539 #else
  63540 #define vst3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63541   float64x2x3_t __s1 = __p1; \
  63542   float64x2x3_t __rev1; \
  63543   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63544   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63545   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63546   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 42); \
  63547 })
  63548 #endif
  63549 
  63550 #ifdef __LITTLE_ENDIAN__
  63551 #define vst3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63552   int64x2x3_t __s1 = __p1; \
  63553   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 35); \
  63554 })
  63555 #else
  63556 #define vst3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63557   int64x2x3_t __s1 = __p1; \
  63558   int64x2x3_t __rev1; \
  63559   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63560   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63561   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63562   __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 35); \
  63563 })
  63564 #endif
  63565 
  63566 #define vst3_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63567   uint64x1x3_t __s1 = __p1; \
  63568   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 19); \
  63569 })
  63570 #define vst3_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63571   float64x1x3_t __s1 = __p1; \
  63572   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 10); \
  63573 })
  63574 #define vst3_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63575   int64x1x3_t __s1 = __p1; \
  63576   __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 3); \
  63577 })
  63578 #define vst4_p64(__p0, __p1) __extension__ ({ \
  63579   poly64x1x4_t __s1 = __p1; \
  63580   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 6); \
  63581 })
  63582 #ifdef __LITTLE_ENDIAN__
  63583 #define vst4q_p64(__p0, __p1) __extension__ ({ \
  63584   poly64x2x4_t __s1 = __p1; \
  63585   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 38); \
  63586 })
  63587 #else
  63588 #define vst4q_p64(__p0, __p1) __extension__ ({ \
  63589   poly64x2x4_t __s1 = __p1; \
  63590   poly64x2x4_t __rev1; \
  63591   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63592   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63593   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63594   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63595   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 38); \
  63596 })
  63597 #endif
  63598 
  63599 #ifdef __LITTLE_ENDIAN__
  63600 #define vst4q_u64(__p0, __p1) __extension__ ({ \
  63601   uint64x2x4_t __s1 = __p1; \
  63602   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 51); \
  63603 })
  63604 #else
  63605 #define vst4q_u64(__p0, __p1) __extension__ ({ \
  63606   uint64x2x4_t __s1 = __p1; \
  63607   uint64x2x4_t __rev1; \
  63608   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63609   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63610   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63611   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63612   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 51); \
  63613 })
  63614 #endif
  63615 
  63616 #ifdef __LITTLE_ENDIAN__
  63617 #define vst4q_f64(__p0, __p1) __extension__ ({ \
  63618   float64x2x4_t __s1 = __p1; \
  63619   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 42); \
  63620 })
  63621 #else
  63622 #define vst4q_f64(__p0, __p1) __extension__ ({ \
  63623   float64x2x4_t __s1 = __p1; \
  63624   float64x2x4_t __rev1; \
  63625   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63626   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63627   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63628   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63629   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 42); \
  63630 })
  63631 #endif
  63632 
  63633 #ifdef __LITTLE_ENDIAN__
  63634 #define vst4q_s64(__p0, __p1) __extension__ ({ \
  63635   int64x2x4_t __s1 = __p1; \
  63636   __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 35); \
  63637 })
  63638 #else
  63639 #define vst4q_s64(__p0, __p1) __extension__ ({ \
  63640   int64x2x4_t __s1 = __p1; \
  63641   int64x2x4_t __rev1; \
  63642   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63643   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63644   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63645   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63646   __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 35); \
  63647 })
  63648 #endif
  63649 
  63650 #define vst4_f64(__p0, __p1) __extension__ ({ \
  63651   float64x1x4_t __s1 = __p1; \
  63652   __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 10); \
  63653 })
  63654 #define vst4_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  63655   poly64x1x4_t __s1 = __p1; \
  63656   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 6); \
  63657 })
  63658 #ifdef __LITTLE_ENDIAN__
  63659 #define vst4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  63660   poly8x16x4_t __s1 = __p1; \
  63661   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 36); \
  63662 })
  63663 #else
  63664 #define vst4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  63665   poly8x16x4_t __s1 = __p1; \
  63666   poly8x16x4_t __rev1; \
  63667   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63668   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63669   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63670   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63671   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 36); \
  63672 })
  63673 #endif
  63674 
  63675 #ifdef __LITTLE_ENDIAN__
  63676 #define vst4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  63677   poly64x2x4_t __s1 = __p1; \
  63678   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 38); \
  63679 })
  63680 #else
  63681 #define vst4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  63682   poly64x2x4_t __s1 = __p1; \
  63683   poly64x2x4_t __rev1; \
  63684   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63685   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63686   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63687   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63688   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 38); \
  63689 })
  63690 #endif
  63691 
  63692 #ifdef __LITTLE_ENDIAN__
  63693 #define vst4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  63694   uint8x16x4_t __s1 = __p1; \
  63695   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 48); \
  63696 })
  63697 #else
  63698 #define vst4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  63699   uint8x16x4_t __s1 = __p1; \
  63700   uint8x16x4_t __rev1; \
  63701   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63702   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63703   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63704   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63705   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 48); \
  63706 })
  63707 #endif
  63708 
  63709 #ifdef __LITTLE_ENDIAN__
  63710 #define vst4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63711   uint64x2x4_t __s1 = __p1; \
  63712   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 51); \
  63713 })
  63714 #else
  63715 #define vst4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63716   uint64x2x4_t __s1 = __p1; \
  63717   uint64x2x4_t __rev1; \
  63718   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63719   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63720   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63721   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63722   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 51); \
  63723 })
  63724 #endif
  63725 
  63726 #ifdef __LITTLE_ENDIAN__
  63727 #define vst4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  63728   int8x16x4_t __s1 = __p1; \
  63729   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 32); \
  63730 })
  63731 #else
  63732 #define vst4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  63733   int8x16x4_t __s1 = __p1; \
  63734   int8x16x4_t __rev1; \
  63735   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63736   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63737   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63738   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  63739   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 32); \
  63740 })
  63741 #endif
  63742 
  63743 #ifdef __LITTLE_ENDIAN__
  63744 #define vst4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63745   float64x2x4_t __s1 = __p1; \
  63746   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 42); \
  63747 })
  63748 #else
  63749 #define vst4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63750   float64x2x4_t __s1 = __p1; \
  63751   float64x2x4_t __rev1; \
  63752   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63753   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63754   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63755   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63756   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 42); \
  63757 })
  63758 #endif
  63759 
  63760 #ifdef __LITTLE_ENDIAN__
  63761 #define vst4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63762   int64x2x4_t __s1 = __p1; \
  63763   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 35); \
  63764 })
  63765 #else
  63766 #define vst4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63767   int64x2x4_t __s1 = __p1; \
  63768   int64x2x4_t __rev1; \
  63769   __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  63770   __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  63771   __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  63772   __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \
  63773   __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 35); \
  63774 })
  63775 #endif
  63776 
  63777 #define vst4_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  63778   uint64x1x4_t __s1 = __p1; \
  63779   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 19); \
  63780 })
  63781 #define vst4_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  63782   float64x1x4_t __s1 = __p1; \
  63783   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 10); \
  63784 })
  63785 #define vst4_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  63786   int64x1x4_t __s1 = __p1; \
  63787   __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 3); \
  63788 })
  63789 #define vstrq_p128(__p0, __p1) __extension__ ({ \
  63790   poly128_t __s1 = __p1; \
  63791   __builtin_neon_vstrq_p128(__p0, __s1); \
  63792 })
  63793 __ai __attribute__((target("neon"))) uint64_t vsubd_u64(uint64_t __p0, uint64_t __p1) {
  63794   uint64_t __ret;
  63795   __ret = (uint64_t) __builtin_neon_vsubd_u64(__p0, __p1);
  63796   return __ret;
  63797 }
  63798 __ai __attribute__((target("neon"))) int64_t vsubd_s64(int64_t __p0, int64_t __p1) {
  63799   int64_t __ret;
  63800   __ret = (int64_t) __builtin_neon_vsubd_s64(__p0, __p1);
  63801   return __ret;
  63802 }
  63803 #ifdef __LITTLE_ENDIAN__
  63804 __ai __attribute__((target("neon"))) float64x2_t vsubq_f64(float64x2_t __p0, float64x2_t __p1) {
  63805   float64x2_t __ret;
  63806   __ret = __p0 - __p1;
  63807   return __ret;
  63808 }
  63809 #else
  63810 __ai __attribute__((target("neon"))) float64x2_t vsubq_f64(float64x2_t __p0, float64x2_t __p1) {
  63811   float64x2_t __ret;
  63812   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  63813   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  63814   __ret = __rev0 - __rev1;
  63815   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  63816   return __ret;
  63817 }
  63818 #endif
  63819 
  63820 __ai __attribute__((target("neon"))) float64x1_t vsub_f64(float64x1_t __p0, float64x1_t __p1) {
  63821   float64x1_t __ret;
  63822   __ret = __p0 - __p1;
  63823   return __ret;
  63824 }
  63825 #ifdef __LITTLE_ENDIAN__
  63826 __ai __attribute__((target("neon"))) uint16x8_t vsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  63827   uint16x8_t __ret;
  63828   __ret = vcombine_u16(__p0, vsubhn_u32(__p1, __p2));
  63829   return __ret;
  63830 }
  63831 #else
  63832 __ai __attribute__((target("neon"))) uint16x8_t vsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  63833   uint16x8_t __ret;
  63834   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  63835   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  63836   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  63837   __ret = __noswap_vcombine_u16(__rev0, __noswap_vsubhn_u32(__rev1, __rev2));
  63838   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  63839   return __ret;
  63840 }
  63841 #endif
  63842 
  63843 #ifdef __LITTLE_ENDIAN__
  63844 __ai __attribute__((target("neon"))) uint32x4_t vsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  63845   uint32x4_t __ret;
  63846   __ret = vcombine_u32(__p0, vsubhn_u64(__p1, __p2));
  63847   return __ret;
  63848 }
  63849 #else
  63850 __ai __attribute__((target("neon"))) uint32x4_t vsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  63851   uint32x4_t __ret;
  63852   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  63853   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  63854   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  63855   __ret = __noswap_vcombine_u32(__rev0, __noswap_vsubhn_u64(__rev1, __rev2));
  63856   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  63857   return __ret;
  63858 }
  63859 #endif
  63860 
  63861 #ifdef __LITTLE_ENDIAN__
  63862 __ai __attribute__((target("neon"))) uint8x16_t vsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  63863   uint8x16_t __ret;
  63864   __ret = vcombine_u8(__p0, vsubhn_u16(__p1, __p2));
  63865   return __ret;
  63866 }
  63867 #else
  63868 __ai __attribute__((target("neon"))) uint8x16_t vsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  63869   uint8x16_t __ret;
  63870   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  63871   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  63872   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  63873   __ret = __noswap_vcombine_u8(__rev0, __noswap_vsubhn_u16(__rev1, __rev2));
  63874   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63875   return __ret;
  63876 }
  63877 #endif
  63878 
  63879 #ifdef __LITTLE_ENDIAN__
  63880 __ai __attribute__((target("neon"))) int16x8_t vsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  63881   int16x8_t __ret;
  63882   __ret = vcombine_s16(__p0, vsubhn_s32(__p1, __p2));
  63883   return __ret;
  63884 }
  63885 #else
  63886 __ai __attribute__((target("neon"))) int16x8_t vsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  63887   int16x8_t __ret;
  63888   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  63889   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  63890   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  63891   __ret = __noswap_vcombine_s16(__rev0, __noswap_vsubhn_s32(__rev1, __rev2));
  63892   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  63893   return __ret;
  63894 }
  63895 #endif
  63896 
  63897 #ifdef __LITTLE_ENDIAN__
  63898 __ai __attribute__((target("neon"))) int32x4_t vsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  63899   int32x4_t __ret;
  63900   __ret = vcombine_s32(__p0, vsubhn_s64(__p1, __p2));
  63901   return __ret;
  63902 }
  63903 #else
  63904 __ai __attribute__((target("neon"))) int32x4_t vsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  63905   int32x4_t __ret;
  63906   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  63907   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  63908   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  63909   __ret = __noswap_vcombine_s32(__rev0, __noswap_vsubhn_s64(__rev1, __rev2));
  63910   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  63911   return __ret;
  63912 }
  63913 #endif
  63914 
  63915 #ifdef __LITTLE_ENDIAN__
  63916 __ai __attribute__((target("neon"))) int8x16_t vsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  63917   int8x16_t __ret;
  63918   __ret = vcombine_s8(__p0, vsubhn_s16(__p1, __p2));
  63919   return __ret;
  63920 }
  63921 #else
  63922 __ai __attribute__((target("neon"))) int8x16_t vsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  63923   int8x16_t __ret;
  63924   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  63925   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  63926   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  63927   __ret = __noswap_vcombine_s8(__rev0, __noswap_vsubhn_s16(__rev1, __rev2));
  63928   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63929   return __ret;
  63930 }
  63931 #endif
  63932 
  63933 #ifdef __LITTLE_ENDIAN__
  63934 __ai __attribute__((target("neon"))) uint16x8_t vsubl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  63935   uint16x8_t __ret;
  63936   __ret = vmovl_high_u8(__p0) - vmovl_high_u8(__p1);
  63937   return __ret;
  63938 }
  63939 #else
  63940 __ai __attribute__((target("neon"))) uint16x8_t vsubl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  63941   uint16x8_t __ret;
  63942   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63943   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63944   __ret = __noswap_vmovl_high_u8(__rev0) - __noswap_vmovl_high_u8(__rev1);
  63945   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  63946   return __ret;
  63947 }
  63948 #endif
  63949 
  63950 #ifdef __LITTLE_ENDIAN__
  63951 __ai __attribute__((target("neon"))) uint64x2_t vsubl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  63952   uint64x2_t __ret;
  63953   __ret = vmovl_high_u32(__p0) - vmovl_high_u32(__p1);
  63954   return __ret;
  63955 }
  63956 #else
  63957 __ai __attribute__((target("neon"))) uint64x2_t vsubl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  63958   uint64x2_t __ret;
  63959   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  63960   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  63961   __ret = __noswap_vmovl_high_u32(__rev0) - __noswap_vmovl_high_u32(__rev1);
  63962   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  63963   return __ret;
  63964 }
  63965 #endif
  63966 
  63967 #ifdef __LITTLE_ENDIAN__
  63968 __ai __attribute__((target("neon"))) uint32x4_t vsubl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  63969   uint32x4_t __ret;
  63970   __ret = vmovl_high_u16(__p0) - vmovl_high_u16(__p1);
  63971   return __ret;
  63972 }
  63973 #else
  63974 __ai __attribute__((target("neon"))) uint32x4_t vsubl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  63975   uint32x4_t __ret;
  63976   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  63977   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  63978   __ret = __noswap_vmovl_high_u16(__rev0) - __noswap_vmovl_high_u16(__rev1);
  63979   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  63980   return __ret;
  63981 }
  63982 #endif
  63983 
  63984 #ifdef __LITTLE_ENDIAN__
  63985 __ai __attribute__((target("neon"))) int16x8_t vsubl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  63986   int16x8_t __ret;
  63987   __ret = vmovl_high_s8(__p0) - vmovl_high_s8(__p1);
  63988   return __ret;
  63989 }
  63990 #else
  63991 __ai __attribute__((target("neon"))) int16x8_t vsubl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  63992   int16x8_t __ret;
  63993   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63994   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  63995   __ret = __noswap_vmovl_high_s8(__rev0) - __noswap_vmovl_high_s8(__rev1);
  63996   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  63997   return __ret;
  63998 }
  63999 #endif
  64000 
  64001 #ifdef __LITTLE_ENDIAN__
  64002 __ai __attribute__((target("neon"))) int64x2_t vsubl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  64003   int64x2_t __ret;
  64004   __ret = vmovl_high_s32(__p0) - vmovl_high_s32(__p1);
  64005   return __ret;
  64006 }
  64007 #else
  64008 __ai __attribute__((target("neon"))) int64x2_t vsubl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  64009   int64x2_t __ret;
  64010   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64011   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64012   __ret = __noswap_vmovl_high_s32(__rev0) - __noswap_vmovl_high_s32(__rev1);
  64013   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64014   return __ret;
  64015 }
  64016 #endif
  64017 
  64018 #ifdef __LITTLE_ENDIAN__
  64019 __ai __attribute__((target("neon"))) int32x4_t vsubl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  64020   int32x4_t __ret;
  64021   __ret = vmovl_high_s16(__p0) - vmovl_high_s16(__p1);
  64022   return __ret;
  64023 }
  64024 #else
  64025 __ai __attribute__((target("neon"))) int32x4_t vsubl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  64026   int32x4_t __ret;
  64027   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64028   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64029   __ret = __noswap_vmovl_high_s16(__rev0) - __noswap_vmovl_high_s16(__rev1);
  64030   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64031   return __ret;
  64032 }
  64033 #endif
  64034 
  64035 #ifdef __LITTLE_ENDIAN__
  64036 __ai __attribute__((target("neon"))) uint16x8_t vsubw_high_u8(uint16x8_t __p0, uint8x16_t __p1) {
  64037   uint16x8_t __ret;
  64038   __ret = __p0 - vmovl_high_u8(__p1);
  64039   return __ret;
  64040 }
  64041 #else
  64042 __ai __attribute__((target("neon"))) uint16x8_t vsubw_high_u8(uint16x8_t __p0, uint8x16_t __p1) {
  64043   uint16x8_t __ret;
  64044   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64045   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64046   __ret = __rev0 - __noswap_vmovl_high_u8(__rev1);
  64047   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64048   return __ret;
  64049 }
  64050 #endif
  64051 
  64052 #ifdef __LITTLE_ENDIAN__
  64053 __ai __attribute__((target("neon"))) uint64x2_t vsubw_high_u32(uint64x2_t __p0, uint32x4_t __p1) {
  64054   uint64x2_t __ret;
  64055   __ret = __p0 - vmovl_high_u32(__p1);
  64056   return __ret;
  64057 }
  64058 #else
  64059 __ai __attribute__((target("neon"))) uint64x2_t vsubw_high_u32(uint64x2_t __p0, uint32x4_t __p1) {
  64060   uint64x2_t __ret;
  64061   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64062   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64063   __ret = __rev0 - __noswap_vmovl_high_u32(__rev1);
  64064   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64065   return __ret;
  64066 }
  64067 #endif
  64068 
  64069 #ifdef __LITTLE_ENDIAN__
  64070 __ai __attribute__((target("neon"))) uint32x4_t vsubw_high_u16(uint32x4_t __p0, uint16x8_t __p1) {
  64071   uint32x4_t __ret;
  64072   __ret = __p0 - vmovl_high_u16(__p1);
  64073   return __ret;
  64074 }
  64075 #else
  64076 __ai __attribute__((target("neon"))) uint32x4_t vsubw_high_u16(uint32x4_t __p0, uint16x8_t __p1) {
  64077   uint32x4_t __ret;
  64078   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64079   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64080   __ret = __rev0 - __noswap_vmovl_high_u16(__rev1);
  64081   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64082   return __ret;
  64083 }
  64084 #endif
  64085 
  64086 #ifdef __LITTLE_ENDIAN__
  64087 __ai __attribute__((target("neon"))) int16x8_t vsubw_high_s8(int16x8_t __p0, int8x16_t __p1) {
  64088   int16x8_t __ret;
  64089   __ret = __p0 - vmovl_high_s8(__p1);
  64090   return __ret;
  64091 }
  64092 #else
  64093 __ai __attribute__((target("neon"))) int16x8_t vsubw_high_s8(int16x8_t __p0, int8x16_t __p1) {
  64094   int16x8_t __ret;
  64095   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64096   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64097   __ret = __rev0 - __noswap_vmovl_high_s8(__rev1);
  64098   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64099   return __ret;
  64100 }
  64101 #endif
  64102 
  64103 #ifdef __LITTLE_ENDIAN__
  64104 __ai __attribute__((target("neon"))) int64x2_t vsubw_high_s32(int64x2_t __p0, int32x4_t __p1) {
  64105   int64x2_t __ret;
  64106   __ret = __p0 - vmovl_high_s32(__p1);
  64107   return __ret;
  64108 }
  64109 #else
  64110 __ai __attribute__((target("neon"))) int64x2_t vsubw_high_s32(int64x2_t __p0, int32x4_t __p1) {
  64111   int64x2_t __ret;
  64112   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64113   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64114   __ret = __rev0 - __noswap_vmovl_high_s32(__rev1);
  64115   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64116   return __ret;
  64117 }
  64118 #endif
  64119 
  64120 #ifdef __LITTLE_ENDIAN__
  64121 __ai __attribute__((target("neon"))) int32x4_t vsubw_high_s16(int32x4_t __p0, int16x8_t __p1) {
  64122   int32x4_t __ret;
  64123   __ret = __p0 - vmovl_high_s16(__p1);
  64124   return __ret;
  64125 }
  64126 #else
  64127 __ai __attribute__((target("neon"))) int32x4_t vsubw_high_s16(int32x4_t __p0, int16x8_t __p1) {
  64128   int32x4_t __ret;
  64129   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64130   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64131   __ret = __rev0 - __noswap_vmovl_high_s16(__rev1);
  64132   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64133   return __ret;
  64134 }
  64135 #endif
  64136 
  64137 #ifdef __LITTLE_ENDIAN__
  64138 __ai __attribute__((target("neon"))) poly8x8_t vtrn1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  64139   poly8x8_t __ret;
  64140   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64141   return __ret;
  64142 }
  64143 #else
  64144 __ai __attribute__((target("neon"))) poly8x8_t vtrn1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  64145   poly8x8_t __ret;
  64146   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64147   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64148   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64149   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64150   return __ret;
  64151 }
  64152 #endif
  64153 
  64154 #ifdef __LITTLE_ENDIAN__
  64155 __ai __attribute__((target("neon"))) poly16x4_t vtrn1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  64156   poly16x4_t __ret;
  64157   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64158   return __ret;
  64159 }
  64160 #else
  64161 __ai __attribute__((target("neon"))) poly16x4_t vtrn1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  64162   poly16x4_t __ret;
  64163   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64164   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64165   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64166   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64167   return __ret;
  64168 }
  64169 #endif
  64170 
  64171 #ifdef __LITTLE_ENDIAN__
  64172 __ai __attribute__((target("neon"))) poly8x16_t vtrn1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  64173   poly8x16_t __ret;
  64174   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64175   return __ret;
  64176 }
  64177 #else
  64178 __ai __attribute__((target("neon"))) poly8x16_t vtrn1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  64179   poly8x16_t __ret;
  64180   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64181   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64182   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64183   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64184   return __ret;
  64185 }
  64186 #endif
  64187 
  64188 #ifdef __LITTLE_ENDIAN__
  64189 __ai __attribute__((target("neon"))) poly64x2_t vtrn1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64190   poly64x2_t __ret;
  64191   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64192   return __ret;
  64193 }
  64194 #else
  64195 __ai __attribute__((target("neon"))) poly64x2_t vtrn1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64196   poly64x2_t __ret;
  64197   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64198   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64199   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64200   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64201   return __ret;
  64202 }
  64203 #endif
  64204 
  64205 #ifdef __LITTLE_ENDIAN__
  64206 __ai __attribute__((target("neon"))) poly16x8_t vtrn1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  64207   poly16x8_t __ret;
  64208   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64209   return __ret;
  64210 }
  64211 #else
  64212 __ai __attribute__((target("neon"))) poly16x8_t vtrn1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  64213   poly16x8_t __ret;
  64214   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64215   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64216   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64217   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64218   return __ret;
  64219 }
  64220 #endif
  64221 
  64222 #ifdef __LITTLE_ENDIAN__
  64223 __ai __attribute__((target("neon"))) uint8x16_t vtrn1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  64224   uint8x16_t __ret;
  64225   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64226   return __ret;
  64227 }
  64228 #else
  64229 __ai __attribute__((target("neon"))) uint8x16_t vtrn1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  64230   uint8x16_t __ret;
  64231   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64232   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64233   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64234   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64235   return __ret;
  64236 }
  64237 #endif
  64238 
  64239 #ifdef __LITTLE_ENDIAN__
  64240 __ai __attribute__((target("neon"))) uint32x4_t vtrn1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  64241   uint32x4_t __ret;
  64242   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64243   return __ret;
  64244 }
  64245 #else
  64246 __ai __attribute__((target("neon"))) uint32x4_t vtrn1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  64247   uint32x4_t __ret;
  64248   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64249   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64250   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64251   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64252   return __ret;
  64253 }
  64254 #endif
  64255 
  64256 #ifdef __LITTLE_ENDIAN__
  64257 __ai __attribute__((target("neon"))) uint64x2_t vtrn1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64258   uint64x2_t __ret;
  64259   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64260   return __ret;
  64261 }
  64262 #else
  64263 __ai __attribute__((target("neon"))) uint64x2_t vtrn1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64264   uint64x2_t __ret;
  64265   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64266   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64267   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64268   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64269   return __ret;
  64270 }
  64271 #endif
  64272 
  64273 #ifdef __LITTLE_ENDIAN__
  64274 __ai __attribute__((target("neon"))) uint16x8_t vtrn1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  64275   uint16x8_t __ret;
  64276   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64277   return __ret;
  64278 }
  64279 #else
  64280 __ai __attribute__((target("neon"))) uint16x8_t vtrn1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  64281   uint16x8_t __ret;
  64282   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64283   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64284   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64285   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64286   return __ret;
  64287 }
  64288 #endif
  64289 
  64290 #ifdef __LITTLE_ENDIAN__
  64291 __ai __attribute__((target("neon"))) int8x16_t vtrn1q_s8(int8x16_t __p0, int8x16_t __p1) {
  64292   int8x16_t __ret;
  64293   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64294   return __ret;
  64295 }
  64296 #else
  64297 __ai __attribute__((target("neon"))) int8x16_t vtrn1q_s8(int8x16_t __p0, int8x16_t __p1) {
  64298   int8x16_t __ret;
  64299   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64300   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64301   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30);
  64302   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64303   return __ret;
  64304 }
  64305 #endif
  64306 
  64307 #ifdef __LITTLE_ENDIAN__
  64308 __ai __attribute__((target("neon"))) float64x2_t vtrn1q_f64(float64x2_t __p0, float64x2_t __p1) {
  64309   float64x2_t __ret;
  64310   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64311   return __ret;
  64312 }
  64313 #else
  64314 __ai __attribute__((target("neon"))) float64x2_t vtrn1q_f64(float64x2_t __p0, float64x2_t __p1) {
  64315   float64x2_t __ret;
  64316   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64317   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64318   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64319   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64320   return __ret;
  64321 }
  64322 #endif
  64323 
  64324 #ifdef __LITTLE_ENDIAN__
  64325 __ai __attribute__((target("neon"))) float32x4_t vtrn1q_f32(float32x4_t __p0, float32x4_t __p1) {
  64326   float32x4_t __ret;
  64327   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64328   return __ret;
  64329 }
  64330 #else
  64331 __ai __attribute__((target("neon"))) float32x4_t vtrn1q_f32(float32x4_t __p0, float32x4_t __p1) {
  64332   float32x4_t __ret;
  64333   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64334   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64335   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64336   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64337   return __ret;
  64338 }
  64339 #endif
  64340 
  64341 #ifdef __LITTLE_ENDIAN__
  64342 __ai __attribute__((target("neon"))) int32x4_t vtrn1q_s32(int32x4_t __p0, int32x4_t __p1) {
  64343   int32x4_t __ret;
  64344   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64345   return __ret;
  64346 }
  64347 #else
  64348 __ai __attribute__((target("neon"))) int32x4_t vtrn1q_s32(int32x4_t __p0, int32x4_t __p1) {
  64349   int32x4_t __ret;
  64350   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64351   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64352   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64353   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64354   return __ret;
  64355 }
  64356 #endif
  64357 
  64358 #ifdef __LITTLE_ENDIAN__
  64359 __ai __attribute__((target("neon"))) int64x2_t vtrn1q_s64(int64x2_t __p0, int64x2_t __p1) {
  64360   int64x2_t __ret;
  64361   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64362   return __ret;
  64363 }
  64364 #else
  64365 __ai __attribute__((target("neon"))) int64x2_t vtrn1q_s64(int64x2_t __p0, int64x2_t __p1) {
  64366   int64x2_t __ret;
  64367   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64368   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64369   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64370   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64371   return __ret;
  64372 }
  64373 #endif
  64374 
  64375 #ifdef __LITTLE_ENDIAN__
  64376 __ai __attribute__((target("neon"))) int16x8_t vtrn1q_s16(int16x8_t __p0, int16x8_t __p1) {
  64377   int16x8_t __ret;
  64378   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64379   return __ret;
  64380 }
  64381 #else
  64382 __ai __attribute__((target("neon"))) int16x8_t vtrn1q_s16(int16x8_t __p0, int16x8_t __p1) {
  64383   int16x8_t __ret;
  64384   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64385   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64386   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64387   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64388   return __ret;
  64389 }
  64390 #endif
  64391 
  64392 #ifdef __LITTLE_ENDIAN__
  64393 __ai __attribute__((target("neon"))) uint8x8_t vtrn1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  64394   uint8x8_t __ret;
  64395   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64396   return __ret;
  64397 }
  64398 #else
  64399 __ai __attribute__((target("neon"))) uint8x8_t vtrn1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  64400   uint8x8_t __ret;
  64401   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64402   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64403   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64404   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64405   return __ret;
  64406 }
  64407 #endif
  64408 
  64409 #ifdef __LITTLE_ENDIAN__
  64410 __ai __attribute__((target("neon"))) uint32x2_t vtrn1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  64411   uint32x2_t __ret;
  64412   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64413   return __ret;
  64414 }
  64415 #else
  64416 __ai __attribute__((target("neon"))) uint32x2_t vtrn1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  64417   uint32x2_t __ret;
  64418   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64419   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64420   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64421   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64422   return __ret;
  64423 }
  64424 #endif
  64425 
  64426 #ifdef __LITTLE_ENDIAN__
  64427 __ai __attribute__((target("neon"))) uint16x4_t vtrn1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  64428   uint16x4_t __ret;
  64429   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64430   return __ret;
  64431 }
  64432 #else
  64433 __ai __attribute__((target("neon"))) uint16x4_t vtrn1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  64434   uint16x4_t __ret;
  64435   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64436   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64437   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64438   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64439   return __ret;
  64440 }
  64441 #endif
  64442 
  64443 #ifdef __LITTLE_ENDIAN__
  64444 __ai __attribute__((target("neon"))) int8x8_t vtrn1_s8(int8x8_t __p0, int8x8_t __p1) {
  64445   int8x8_t __ret;
  64446   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64447   return __ret;
  64448 }
  64449 #else
  64450 __ai __attribute__((target("neon"))) int8x8_t vtrn1_s8(int8x8_t __p0, int8x8_t __p1) {
  64451   int8x8_t __ret;
  64452   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64453   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64454   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64455   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64456   return __ret;
  64457 }
  64458 #endif
  64459 
  64460 #ifdef __LITTLE_ENDIAN__
  64461 __ai __attribute__((target("neon"))) float32x2_t vtrn1_f32(float32x2_t __p0, float32x2_t __p1) {
  64462   float32x2_t __ret;
  64463   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64464   return __ret;
  64465 }
  64466 #else
  64467 __ai __attribute__((target("neon"))) float32x2_t vtrn1_f32(float32x2_t __p0, float32x2_t __p1) {
  64468   float32x2_t __ret;
  64469   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64470   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64471   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64472   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64473   return __ret;
  64474 }
  64475 #endif
  64476 
  64477 #ifdef __LITTLE_ENDIAN__
  64478 __ai __attribute__((target("neon"))) int32x2_t vtrn1_s32(int32x2_t __p0, int32x2_t __p1) {
  64479   int32x2_t __ret;
  64480   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  64481   return __ret;
  64482 }
  64483 #else
  64484 __ai __attribute__((target("neon"))) int32x2_t vtrn1_s32(int32x2_t __p0, int32x2_t __p1) {
  64485   int32x2_t __ret;
  64486   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64487   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64488   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  64489   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64490   return __ret;
  64491 }
  64492 #endif
  64493 
  64494 #ifdef __LITTLE_ENDIAN__
  64495 __ai __attribute__((target("neon"))) int16x4_t vtrn1_s16(int16x4_t __p0, int16x4_t __p1) {
  64496   int16x4_t __ret;
  64497   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64498   return __ret;
  64499 }
  64500 #else
  64501 __ai __attribute__((target("neon"))) int16x4_t vtrn1_s16(int16x4_t __p0, int16x4_t __p1) {
  64502   int16x4_t __ret;
  64503   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64504   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64505   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64506   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64507   return __ret;
  64508 }
  64509 #endif
  64510 
  64511 #ifdef __LITTLE_ENDIAN__
  64512 __ai __attribute__((target("neon"))) float16x8_t vtrn1q_f16(float16x8_t __p0, float16x8_t __p1) {
  64513   float16x8_t __ret;
  64514   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14);
  64515   return __ret;
  64516 }
  64517 #else
  64518 __ai __attribute__((target("neon"))) float16x8_t vtrn1q_f16(float16x8_t __p0, float16x8_t __p1) {
  64519   float16x8_t __ret;
  64520   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64521   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64522   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14);
  64523   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64524   return __ret;
  64525 }
  64526 #endif
  64527 
  64528 #ifdef __LITTLE_ENDIAN__
  64529 __ai __attribute__((target("neon"))) float16x4_t vtrn1_f16(float16x4_t __p0, float16x4_t __p1) {
  64530   float16x4_t __ret;
  64531   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6);
  64532   return __ret;
  64533 }
  64534 #else
  64535 __ai __attribute__((target("neon"))) float16x4_t vtrn1_f16(float16x4_t __p0, float16x4_t __p1) {
  64536   float16x4_t __ret;
  64537   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64538   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64539   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6);
  64540   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64541   return __ret;
  64542 }
  64543 #endif
  64544 
  64545 #ifdef __LITTLE_ENDIAN__
  64546 __ai __attribute__((target("neon"))) poly8x8_t vtrn2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  64547   poly8x8_t __ret;
  64548   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64549   return __ret;
  64550 }
  64551 #else
  64552 __ai __attribute__((target("neon"))) poly8x8_t vtrn2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  64553   poly8x8_t __ret;
  64554   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64555   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64556   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64557   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64558   return __ret;
  64559 }
  64560 #endif
  64561 
  64562 #ifdef __LITTLE_ENDIAN__
  64563 __ai __attribute__((target("neon"))) poly16x4_t vtrn2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  64564   poly16x4_t __ret;
  64565   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64566   return __ret;
  64567 }
  64568 #else
  64569 __ai __attribute__((target("neon"))) poly16x4_t vtrn2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  64570   poly16x4_t __ret;
  64571   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64572   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64573   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64574   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64575   return __ret;
  64576 }
  64577 #endif
  64578 
  64579 #ifdef __LITTLE_ENDIAN__
  64580 __ai __attribute__((target("neon"))) poly8x16_t vtrn2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  64581   poly8x16_t __ret;
  64582   __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64583   return __ret;
  64584 }
  64585 #else
  64586 __ai __attribute__((target("neon"))) poly8x16_t vtrn2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  64587   poly8x16_t __ret;
  64588   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64589   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64590   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64591   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64592   return __ret;
  64593 }
  64594 #endif
  64595 
  64596 #ifdef __LITTLE_ENDIAN__
  64597 __ai __attribute__((target("neon"))) poly64x2_t vtrn2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64598   poly64x2_t __ret;
  64599   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64600   return __ret;
  64601 }
  64602 #else
  64603 __ai __attribute__((target("neon"))) poly64x2_t vtrn2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64604   poly64x2_t __ret;
  64605   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64606   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64607   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64608   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64609   return __ret;
  64610 }
  64611 #endif
  64612 
  64613 #ifdef __LITTLE_ENDIAN__
  64614 __ai __attribute__((target("neon"))) poly16x8_t vtrn2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  64615   poly16x8_t __ret;
  64616   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64617   return __ret;
  64618 }
  64619 #else
  64620 __ai __attribute__((target("neon"))) poly16x8_t vtrn2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  64621   poly16x8_t __ret;
  64622   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64623   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64624   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64625   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64626   return __ret;
  64627 }
  64628 #endif
  64629 
  64630 #ifdef __LITTLE_ENDIAN__
  64631 __ai __attribute__((target("neon"))) uint8x16_t vtrn2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  64632   uint8x16_t __ret;
  64633   __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64634   return __ret;
  64635 }
  64636 #else
  64637 __ai __attribute__((target("neon"))) uint8x16_t vtrn2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  64638   uint8x16_t __ret;
  64639   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64640   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64641   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64642   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64643   return __ret;
  64644 }
  64645 #endif
  64646 
  64647 #ifdef __LITTLE_ENDIAN__
  64648 __ai __attribute__((target("neon"))) uint32x4_t vtrn2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  64649   uint32x4_t __ret;
  64650   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64651   return __ret;
  64652 }
  64653 #else
  64654 __ai __attribute__((target("neon"))) uint32x4_t vtrn2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  64655   uint32x4_t __ret;
  64656   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64657   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64658   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64659   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64660   return __ret;
  64661 }
  64662 #endif
  64663 
  64664 #ifdef __LITTLE_ENDIAN__
  64665 __ai __attribute__((target("neon"))) uint64x2_t vtrn2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64666   uint64x2_t __ret;
  64667   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64668   return __ret;
  64669 }
  64670 #else
  64671 __ai __attribute__((target("neon"))) uint64x2_t vtrn2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64672   uint64x2_t __ret;
  64673   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64674   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64675   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64676   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64677   return __ret;
  64678 }
  64679 #endif
  64680 
  64681 #ifdef __LITTLE_ENDIAN__
  64682 __ai __attribute__((target("neon"))) uint16x8_t vtrn2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  64683   uint16x8_t __ret;
  64684   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64685   return __ret;
  64686 }
  64687 #else
  64688 __ai __attribute__((target("neon"))) uint16x8_t vtrn2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  64689   uint16x8_t __ret;
  64690   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64691   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64692   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64693   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64694   return __ret;
  64695 }
  64696 #endif
  64697 
  64698 #ifdef __LITTLE_ENDIAN__
  64699 __ai __attribute__((target("neon"))) int8x16_t vtrn2q_s8(int8x16_t __p0, int8x16_t __p1) {
  64700   int8x16_t __ret;
  64701   __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64702   return __ret;
  64703 }
  64704 #else
  64705 __ai __attribute__((target("neon"))) int8x16_t vtrn2q_s8(int8x16_t __p0, int8x16_t __p1) {
  64706   int8x16_t __ret;
  64707   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64708   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64709   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31);
  64710   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  64711   return __ret;
  64712 }
  64713 #endif
  64714 
  64715 #ifdef __LITTLE_ENDIAN__
  64716 __ai __attribute__((target("neon"))) float64x2_t vtrn2q_f64(float64x2_t __p0, float64x2_t __p1) {
  64717   float64x2_t __ret;
  64718   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64719   return __ret;
  64720 }
  64721 #else
  64722 __ai __attribute__((target("neon"))) float64x2_t vtrn2q_f64(float64x2_t __p0, float64x2_t __p1) {
  64723   float64x2_t __ret;
  64724   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64725   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64726   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64727   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64728   return __ret;
  64729 }
  64730 #endif
  64731 
  64732 #ifdef __LITTLE_ENDIAN__
  64733 __ai __attribute__((target("neon"))) float32x4_t vtrn2q_f32(float32x4_t __p0, float32x4_t __p1) {
  64734   float32x4_t __ret;
  64735   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64736   return __ret;
  64737 }
  64738 #else
  64739 __ai __attribute__((target("neon"))) float32x4_t vtrn2q_f32(float32x4_t __p0, float32x4_t __p1) {
  64740   float32x4_t __ret;
  64741   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64742   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64743   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64744   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64745   return __ret;
  64746 }
  64747 #endif
  64748 
  64749 #ifdef __LITTLE_ENDIAN__
  64750 __ai __attribute__((target("neon"))) int32x4_t vtrn2q_s32(int32x4_t __p0, int32x4_t __p1) {
  64751   int32x4_t __ret;
  64752   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64753   return __ret;
  64754 }
  64755 #else
  64756 __ai __attribute__((target("neon"))) int32x4_t vtrn2q_s32(int32x4_t __p0, int32x4_t __p1) {
  64757   int32x4_t __ret;
  64758   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64759   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64760   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64761   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64762   return __ret;
  64763 }
  64764 #endif
  64765 
  64766 #ifdef __LITTLE_ENDIAN__
  64767 __ai __attribute__((target("neon"))) int64x2_t vtrn2q_s64(int64x2_t __p0, int64x2_t __p1) {
  64768   int64x2_t __ret;
  64769   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64770   return __ret;
  64771 }
  64772 #else
  64773 __ai __attribute__((target("neon"))) int64x2_t vtrn2q_s64(int64x2_t __p0, int64x2_t __p1) {
  64774   int64x2_t __ret;
  64775   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64776   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64777   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64778   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64779   return __ret;
  64780 }
  64781 #endif
  64782 
  64783 #ifdef __LITTLE_ENDIAN__
  64784 __ai __attribute__((target("neon"))) int16x8_t vtrn2q_s16(int16x8_t __p0, int16x8_t __p1) {
  64785   int16x8_t __ret;
  64786   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64787   return __ret;
  64788 }
  64789 #else
  64790 __ai __attribute__((target("neon"))) int16x8_t vtrn2q_s16(int16x8_t __p0, int16x8_t __p1) {
  64791   int16x8_t __ret;
  64792   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64793   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64794   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64795   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64796   return __ret;
  64797 }
  64798 #endif
  64799 
  64800 #ifdef __LITTLE_ENDIAN__
  64801 __ai __attribute__((target("neon"))) uint8x8_t vtrn2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  64802   uint8x8_t __ret;
  64803   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64804   return __ret;
  64805 }
  64806 #else
  64807 __ai __attribute__((target("neon"))) uint8x8_t vtrn2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  64808   uint8x8_t __ret;
  64809   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64810   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64811   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64812   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64813   return __ret;
  64814 }
  64815 #endif
  64816 
  64817 #ifdef __LITTLE_ENDIAN__
  64818 __ai __attribute__((target("neon"))) uint32x2_t vtrn2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  64819   uint32x2_t __ret;
  64820   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64821   return __ret;
  64822 }
  64823 #else
  64824 __ai __attribute__((target("neon"))) uint32x2_t vtrn2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  64825   uint32x2_t __ret;
  64826   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64827   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64828   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64829   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64830   return __ret;
  64831 }
  64832 #endif
  64833 
  64834 #ifdef __LITTLE_ENDIAN__
  64835 __ai __attribute__((target("neon"))) uint16x4_t vtrn2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  64836   uint16x4_t __ret;
  64837   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64838   return __ret;
  64839 }
  64840 #else
  64841 __ai __attribute__((target("neon"))) uint16x4_t vtrn2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  64842   uint16x4_t __ret;
  64843   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64844   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64845   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64846   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64847   return __ret;
  64848 }
  64849 #endif
  64850 
  64851 #ifdef __LITTLE_ENDIAN__
  64852 __ai __attribute__((target("neon"))) int8x8_t vtrn2_s8(int8x8_t __p0, int8x8_t __p1) {
  64853   int8x8_t __ret;
  64854   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64855   return __ret;
  64856 }
  64857 #else
  64858 __ai __attribute__((target("neon"))) int8x8_t vtrn2_s8(int8x8_t __p0, int8x8_t __p1) {
  64859   int8x8_t __ret;
  64860   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64861   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64862   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64863   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64864   return __ret;
  64865 }
  64866 #endif
  64867 
  64868 #ifdef __LITTLE_ENDIAN__
  64869 __ai __attribute__((target("neon"))) float32x2_t vtrn2_f32(float32x2_t __p0, float32x2_t __p1) {
  64870   float32x2_t __ret;
  64871   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64872   return __ret;
  64873 }
  64874 #else
  64875 __ai __attribute__((target("neon"))) float32x2_t vtrn2_f32(float32x2_t __p0, float32x2_t __p1) {
  64876   float32x2_t __ret;
  64877   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64878   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64879   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64880   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64881   return __ret;
  64882 }
  64883 #endif
  64884 
  64885 #ifdef __LITTLE_ENDIAN__
  64886 __ai __attribute__((target("neon"))) int32x2_t vtrn2_s32(int32x2_t __p0, int32x2_t __p1) {
  64887   int32x2_t __ret;
  64888   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  64889   return __ret;
  64890 }
  64891 #else
  64892 __ai __attribute__((target("neon"))) int32x2_t vtrn2_s32(int32x2_t __p0, int32x2_t __p1) {
  64893   int32x2_t __ret;
  64894   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64895   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64896   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  64897   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64898   return __ret;
  64899 }
  64900 #endif
  64901 
  64902 #ifdef __LITTLE_ENDIAN__
  64903 __ai __attribute__((target("neon"))) int16x4_t vtrn2_s16(int16x4_t __p0, int16x4_t __p1) {
  64904   int16x4_t __ret;
  64905   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64906   return __ret;
  64907 }
  64908 #else
  64909 __ai __attribute__((target("neon"))) int16x4_t vtrn2_s16(int16x4_t __p0, int16x4_t __p1) {
  64910   int16x4_t __ret;
  64911   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64912   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64913   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64914   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64915   return __ret;
  64916 }
  64917 #endif
  64918 
  64919 #ifdef __LITTLE_ENDIAN__
  64920 __ai __attribute__((target("neon"))) float16x8_t vtrn2q_f16(float16x8_t __p0, float16x8_t __p1) {
  64921   float16x8_t __ret;
  64922   __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15);
  64923   return __ret;
  64924 }
  64925 #else
  64926 __ai __attribute__((target("neon"))) float16x8_t vtrn2q_f16(float16x8_t __p0, float16x8_t __p1) {
  64927   float16x8_t __ret;
  64928   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  64929   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  64930   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15);
  64931   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  64932   return __ret;
  64933 }
  64934 #endif
  64935 
  64936 #ifdef __LITTLE_ENDIAN__
  64937 __ai __attribute__((target("neon"))) float16x4_t vtrn2_f16(float16x4_t __p0, float16x4_t __p1) {
  64938   float16x4_t __ret;
  64939   __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7);
  64940   return __ret;
  64941 }
  64942 #else
  64943 __ai __attribute__((target("neon"))) float16x4_t vtrn2_f16(float16x4_t __p0, float16x4_t __p1) {
  64944   float16x4_t __ret;
  64945   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  64946   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  64947   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7);
  64948   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  64949   return __ret;
  64950 }
  64951 #endif
  64952 
  64953 __ai __attribute__((target("neon"))) uint64x1_t vtst_p64(poly64x1_t __p0, poly64x1_t __p1) {
  64954   uint64x1_t __ret;
  64955   __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  64956   return __ret;
  64957 }
  64958 #ifdef __LITTLE_ENDIAN__
  64959 __ai __attribute__((target("neon"))) uint64x2_t vtstq_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64960   uint64x2_t __ret;
  64961   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  64962   return __ret;
  64963 }
  64964 #else
  64965 __ai __attribute__((target("neon"))) uint64x2_t vtstq_p64(poly64x2_t __p0, poly64x2_t __p1) {
  64966   uint64x2_t __ret;
  64967   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64968   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64969   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  64970   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64971   return __ret;
  64972 }
  64973 #endif
  64974 
  64975 #ifdef __LITTLE_ENDIAN__
  64976 __ai __attribute__((target("neon"))) uint64x2_t vtstq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64977   uint64x2_t __ret;
  64978   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  64979   return __ret;
  64980 }
  64981 #else
  64982 __ai __attribute__((target("neon"))) uint64x2_t vtstq_u64(uint64x2_t __p0, uint64x2_t __p1) {
  64983   uint64x2_t __ret;
  64984   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  64985   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  64986   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  64987   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  64988   return __ret;
  64989 }
  64990 #endif
  64991 
  64992 #ifdef __LITTLE_ENDIAN__
  64993 __ai __attribute__((target("neon"))) uint64x2_t vtstq_s64(int64x2_t __p0, int64x2_t __p1) {
  64994   uint64x2_t __ret;
  64995   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51);
  64996   return __ret;
  64997 }
  64998 #else
  64999 __ai __attribute__((target("neon"))) uint64x2_t vtstq_s64(int64x2_t __p0, int64x2_t __p1) {
  65000   uint64x2_t __ret;
  65001   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65002   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65003   __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  65004   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65005   return __ret;
  65006 }
  65007 #endif
  65008 
  65009 __ai __attribute__((target("neon"))) uint64x1_t vtst_u64(uint64x1_t __p0, uint64x1_t __p1) {
  65010   uint64x1_t __ret;
  65011   __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  65012   return __ret;
  65013 }
  65014 __ai __attribute__((target("neon"))) uint64x1_t vtst_s64(int64x1_t __p0, int64x1_t __p1) {
  65015   uint64x1_t __ret;
  65016   __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19);
  65017   return __ret;
  65018 }
  65019 __ai __attribute__((target("neon"))) uint64_t vtstd_u64(uint64_t __p0, uint64_t __p1) {
  65020   uint64_t __ret;
  65021   __ret = (uint64_t) __builtin_neon_vtstd_u64(__p0, __p1);
  65022   return __ret;
  65023 }
  65024 __ai __attribute__((target("neon"))) uint64_t vtstd_s64(int64_t __p0, int64_t __p1) {
  65025   uint64_t __ret;
  65026   __ret = (uint64_t) __builtin_neon_vtstd_s64(__p0, __p1);
  65027   return __ret;
  65028 }
  65029 __ai __attribute__((target("neon"))) int8_t vuqaddb_s8(int8_t __p0, uint8_t __p1) {
  65030   int8_t __ret;
  65031   __ret = (int8_t) __builtin_neon_vuqaddb_s8(__p0, __p1);
  65032   return __ret;
  65033 }
  65034 __ai __attribute__((target("neon"))) int32_t vuqadds_s32(int32_t __p0, uint32_t __p1) {
  65035   int32_t __ret;
  65036   __ret = (int32_t) __builtin_neon_vuqadds_s32(__p0, __p1);
  65037   return __ret;
  65038 }
  65039 __ai __attribute__((target("neon"))) int64_t vuqaddd_s64(int64_t __p0, uint64_t __p1) {
  65040   int64_t __ret;
  65041   __ret = (int64_t) __builtin_neon_vuqaddd_s64(__p0, __p1);
  65042   return __ret;
  65043 }
  65044 __ai __attribute__((target("neon"))) int16_t vuqaddh_s16(int16_t __p0, uint16_t __p1) {
  65045   int16_t __ret;
  65046   __ret = (int16_t) __builtin_neon_vuqaddh_s16(__p0, __p1);
  65047   return __ret;
  65048 }
  65049 #ifdef __LITTLE_ENDIAN__
  65050 __ai __attribute__((target("neon"))) int8x16_t vuqaddq_s8(int8x16_t __p0, uint8x16_t __p1) {
  65051   int8x16_t __ret;
  65052   __ret = (int8x16_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32);
  65053   return __ret;
  65054 }
  65055 #else
  65056 __ai __attribute__((target("neon"))) int8x16_t vuqaddq_s8(int8x16_t __p0, uint8x16_t __p1) {
  65057   int8x16_t __ret;
  65058   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65059   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65060   __ret = (int8x16_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32);
  65061   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65062   return __ret;
  65063 }
  65064 #endif
  65065 
  65066 #ifdef __LITTLE_ENDIAN__
  65067 __ai __attribute__((target("neon"))) int32x4_t vuqaddq_s32(int32x4_t __p0, uint32x4_t __p1) {
  65068   int32x4_t __ret;
  65069   __ret = (int32x4_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34);
  65070   return __ret;
  65071 }
  65072 #else
  65073 __ai __attribute__((target("neon"))) int32x4_t vuqaddq_s32(int32x4_t __p0, uint32x4_t __p1) {
  65074   int32x4_t __ret;
  65075   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65076   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65077   __ret = (int32x4_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34);
  65078   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65079   return __ret;
  65080 }
  65081 #endif
  65082 
  65083 #ifdef __LITTLE_ENDIAN__
  65084 __ai __attribute__((target("neon"))) int64x2_t vuqaddq_s64(int64x2_t __p0, uint64x2_t __p1) {
  65085   int64x2_t __ret;
  65086   __ret = (int64x2_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35);
  65087   return __ret;
  65088 }
  65089 #else
  65090 __ai __attribute__((target("neon"))) int64x2_t vuqaddq_s64(int64x2_t __p0, uint64x2_t __p1) {
  65091   int64x2_t __ret;
  65092   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65093   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65094   __ret = (int64x2_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35);
  65095   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65096   return __ret;
  65097 }
  65098 #endif
  65099 
  65100 #ifdef __LITTLE_ENDIAN__
  65101 __ai __attribute__((target("neon"))) int16x8_t vuqaddq_s16(int16x8_t __p0, uint16x8_t __p1) {
  65102   int16x8_t __ret;
  65103   __ret = (int16x8_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33);
  65104   return __ret;
  65105 }
  65106 #else
  65107 __ai __attribute__((target("neon"))) int16x8_t vuqaddq_s16(int16x8_t __p0, uint16x8_t __p1) {
  65108   int16x8_t __ret;
  65109   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65110   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65111   __ret = (int16x8_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33);
  65112   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65113   return __ret;
  65114 }
  65115 #endif
  65116 
  65117 #ifdef __LITTLE_ENDIAN__
  65118 __ai __attribute__((target("neon"))) int8x8_t vuqadd_s8(int8x8_t __p0, uint8x8_t __p1) {
  65119   int8x8_t __ret;
  65120   __ret = (int8x8_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0);
  65121   return __ret;
  65122 }
  65123 #else
  65124 __ai __attribute__((target("neon"))) int8x8_t vuqadd_s8(int8x8_t __p0, uint8x8_t __p1) {
  65125   int8x8_t __ret;
  65126   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65127   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65128   __ret = (int8x8_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0);
  65129   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65130   return __ret;
  65131 }
  65132 #endif
  65133 
  65134 #ifdef __LITTLE_ENDIAN__
  65135 __ai __attribute__((target("neon"))) int32x2_t vuqadd_s32(int32x2_t __p0, uint32x2_t __p1) {
  65136   int32x2_t __ret;
  65137   __ret = (int32x2_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2);
  65138   return __ret;
  65139 }
  65140 #else
  65141 __ai __attribute__((target("neon"))) int32x2_t vuqadd_s32(int32x2_t __p0, uint32x2_t __p1) {
  65142   int32x2_t __ret;
  65143   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65144   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65145   __ret = (int32x2_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2);
  65146   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65147   return __ret;
  65148 }
  65149 #endif
  65150 
  65151 __ai __attribute__((target("neon"))) int64x1_t vuqadd_s64(int64x1_t __p0, uint64x1_t __p1) {
  65152   int64x1_t __ret;
  65153   __ret = (int64x1_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 3);
  65154   return __ret;
  65155 }
  65156 #ifdef __LITTLE_ENDIAN__
  65157 __ai __attribute__((target("neon"))) int16x4_t vuqadd_s16(int16x4_t __p0, uint16x4_t __p1) {
  65158   int16x4_t __ret;
  65159   __ret = (int16x4_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1);
  65160   return __ret;
  65161 }
  65162 #else
  65163 __ai __attribute__((target("neon"))) int16x4_t vuqadd_s16(int16x4_t __p0, uint16x4_t __p1) {
  65164   int16x4_t __ret;
  65165   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65166   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65167   __ret = (int16x4_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1);
  65168   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65169   return __ret;
  65170 }
  65171 #endif
  65172 
  65173 #ifdef __LITTLE_ENDIAN__
  65174 __ai __attribute__((target("neon"))) poly8x8_t vuzp1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65175   poly8x8_t __ret;
  65176   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65177   return __ret;
  65178 }
  65179 #else
  65180 __ai __attribute__((target("neon"))) poly8x8_t vuzp1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65181   poly8x8_t __ret;
  65182   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65183   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65184   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65185   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65186   return __ret;
  65187 }
  65188 #endif
  65189 
  65190 #ifdef __LITTLE_ENDIAN__
  65191 __ai __attribute__((target("neon"))) poly16x4_t vuzp1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  65192   poly16x4_t __ret;
  65193   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65194   return __ret;
  65195 }
  65196 #else
  65197 __ai __attribute__((target("neon"))) poly16x4_t vuzp1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  65198   poly16x4_t __ret;
  65199   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65200   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65201   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65202   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65203   return __ret;
  65204 }
  65205 #endif
  65206 
  65207 #ifdef __LITTLE_ENDIAN__
  65208 __ai __attribute__((target("neon"))) poly8x16_t vuzp1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  65209   poly8x16_t __ret;
  65210   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65211   return __ret;
  65212 }
  65213 #else
  65214 __ai __attribute__((target("neon"))) poly8x16_t vuzp1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  65215   poly8x16_t __ret;
  65216   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65217   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65218   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65219   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65220   return __ret;
  65221 }
  65222 #endif
  65223 
  65224 #ifdef __LITTLE_ENDIAN__
  65225 __ai __attribute__((target("neon"))) poly64x2_t vuzp1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  65226   poly64x2_t __ret;
  65227   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65228   return __ret;
  65229 }
  65230 #else
  65231 __ai __attribute__((target("neon"))) poly64x2_t vuzp1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  65232   poly64x2_t __ret;
  65233   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65234   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65235   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65236   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65237   return __ret;
  65238 }
  65239 #endif
  65240 
  65241 #ifdef __LITTLE_ENDIAN__
  65242 __ai __attribute__((target("neon"))) poly16x8_t vuzp1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  65243   poly16x8_t __ret;
  65244   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65245   return __ret;
  65246 }
  65247 #else
  65248 __ai __attribute__((target("neon"))) poly16x8_t vuzp1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  65249   poly16x8_t __ret;
  65250   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65251   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65252   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65253   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65254   return __ret;
  65255 }
  65256 #endif
  65257 
  65258 #ifdef __LITTLE_ENDIAN__
  65259 __ai __attribute__((target("neon"))) uint8x16_t vuzp1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  65260   uint8x16_t __ret;
  65261   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65262   return __ret;
  65263 }
  65264 #else
  65265 __ai __attribute__((target("neon"))) uint8x16_t vuzp1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  65266   uint8x16_t __ret;
  65267   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65268   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65269   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65270   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65271   return __ret;
  65272 }
  65273 #endif
  65274 
  65275 #ifdef __LITTLE_ENDIAN__
  65276 __ai __attribute__((target("neon"))) uint32x4_t vuzp1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  65277   uint32x4_t __ret;
  65278   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65279   return __ret;
  65280 }
  65281 #else
  65282 __ai __attribute__((target("neon"))) uint32x4_t vuzp1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  65283   uint32x4_t __ret;
  65284   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65285   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65286   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65287   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65288   return __ret;
  65289 }
  65290 #endif
  65291 
  65292 #ifdef __LITTLE_ENDIAN__
  65293 __ai __attribute__((target("neon"))) uint64x2_t vuzp1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  65294   uint64x2_t __ret;
  65295   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65296   return __ret;
  65297 }
  65298 #else
  65299 __ai __attribute__((target("neon"))) uint64x2_t vuzp1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  65300   uint64x2_t __ret;
  65301   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65302   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65303   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65304   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65305   return __ret;
  65306 }
  65307 #endif
  65308 
  65309 #ifdef __LITTLE_ENDIAN__
  65310 __ai __attribute__((target("neon"))) uint16x8_t vuzp1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  65311   uint16x8_t __ret;
  65312   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65313   return __ret;
  65314 }
  65315 #else
  65316 __ai __attribute__((target("neon"))) uint16x8_t vuzp1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  65317   uint16x8_t __ret;
  65318   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65319   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65320   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65321   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65322   return __ret;
  65323 }
  65324 #endif
  65325 
  65326 #ifdef __LITTLE_ENDIAN__
  65327 __ai __attribute__((target("neon"))) int8x16_t vuzp1q_s8(int8x16_t __p0, int8x16_t __p1) {
  65328   int8x16_t __ret;
  65329   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65330   return __ret;
  65331 }
  65332 #else
  65333 __ai __attribute__((target("neon"))) int8x16_t vuzp1q_s8(int8x16_t __p0, int8x16_t __p1) {
  65334   int8x16_t __ret;
  65335   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65336   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65337   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30);
  65338   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65339   return __ret;
  65340 }
  65341 #endif
  65342 
  65343 #ifdef __LITTLE_ENDIAN__
  65344 __ai __attribute__((target("neon"))) float64x2_t vuzp1q_f64(float64x2_t __p0, float64x2_t __p1) {
  65345   float64x2_t __ret;
  65346   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65347   return __ret;
  65348 }
  65349 #else
  65350 __ai __attribute__((target("neon"))) float64x2_t vuzp1q_f64(float64x2_t __p0, float64x2_t __p1) {
  65351   float64x2_t __ret;
  65352   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65353   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65354   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65355   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65356   return __ret;
  65357 }
  65358 #endif
  65359 
  65360 #ifdef __LITTLE_ENDIAN__
  65361 __ai __attribute__((target("neon"))) float32x4_t vuzp1q_f32(float32x4_t __p0, float32x4_t __p1) {
  65362   float32x4_t __ret;
  65363   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65364   return __ret;
  65365 }
  65366 #else
  65367 __ai __attribute__((target("neon"))) float32x4_t vuzp1q_f32(float32x4_t __p0, float32x4_t __p1) {
  65368   float32x4_t __ret;
  65369   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65370   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65371   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65372   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65373   return __ret;
  65374 }
  65375 #endif
  65376 
  65377 #ifdef __LITTLE_ENDIAN__
  65378 __ai __attribute__((target("neon"))) int32x4_t vuzp1q_s32(int32x4_t __p0, int32x4_t __p1) {
  65379   int32x4_t __ret;
  65380   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65381   return __ret;
  65382 }
  65383 #else
  65384 __ai __attribute__((target("neon"))) int32x4_t vuzp1q_s32(int32x4_t __p0, int32x4_t __p1) {
  65385   int32x4_t __ret;
  65386   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65387   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65388   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65389   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65390   return __ret;
  65391 }
  65392 #endif
  65393 
  65394 #ifdef __LITTLE_ENDIAN__
  65395 __ai __attribute__((target("neon"))) int64x2_t vuzp1q_s64(int64x2_t __p0, int64x2_t __p1) {
  65396   int64x2_t __ret;
  65397   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65398   return __ret;
  65399 }
  65400 #else
  65401 __ai __attribute__((target("neon"))) int64x2_t vuzp1q_s64(int64x2_t __p0, int64x2_t __p1) {
  65402   int64x2_t __ret;
  65403   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65404   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65405   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65406   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65407   return __ret;
  65408 }
  65409 #endif
  65410 
  65411 #ifdef __LITTLE_ENDIAN__
  65412 __ai __attribute__((target("neon"))) int16x8_t vuzp1q_s16(int16x8_t __p0, int16x8_t __p1) {
  65413   int16x8_t __ret;
  65414   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65415   return __ret;
  65416 }
  65417 #else
  65418 __ai __attribute__((target("neon"))) int16x8_t vuzp1q_s16(int16x8_t __p0, int16x8_t __p1) {
  65419   int16x8_t __ret;
  65420   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65421   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65422   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65423   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65424   return __ret;
  65425 }
  65426 #endif
  65427 
  65428 #ifdef __LITTLE_ENDIAN__
  65429 __ai __attribute__((target("neon"))) uint8x8_t vuzp1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  65430   uint8x8_t __ret;
  65431   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65432   return __ret;
  65433 }
  65434 #else
  65435 __ai __attribute__((target("neon"))) uint8x8_t vuzp1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  65436   uint8x8_t __ret;
  65437   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65438   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65439   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65440   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65441   return __ret;
  65442 }
  65443 #endif
  65444 
  65445 #ifdef __LITTLE_ENDIAN__
  65446 __ai __attribute__((target("neon"))) uint32x2_t vuzp1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  65447   uint32x2_t __ret;
  65448   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65449   return __ret;
  65450 }
  65451 #else
  65452 __ai __attribute__((target("neon"))) uint32x2_t vuzp1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  65453   uint32x2_t __ret;
  65454   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65455   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65456   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65457   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65458   return __ret;
  65459 }
  65460 #endif
  65461 
  65462 #ifdef __LITTLE_ENDIAN__
  65463 __ai __attribute__((target("neon"))) uint16x4_t vuzp1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  65464   uint16x4_t __ret;
  65465   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65466   return __ret;
  65467 }
  65468 #else
  65469 __ai __attribute__((target("neon"))) uint16x4_t vuzp1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  65470   uint16x4_t __ret;
  65471   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65472   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65473   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65474   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65475   return __ret;
  65476 }
  65477 #endif
  65478 
  65479 #ifdef __LITTLE_ENDIAN__
  65480 __ai __attribute__((target("neon"))) int8x8_t vuzp1_s8(int8x8_t __p0, int8x8_t __p1) {
  65481   int8x8_t __ret;
  65482   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65483   return __ret;
  65484 }
  65485 #else
  65486 __ai __attribute__((target("neon"))) int8x8_t vuzp1_s8(int8x8_t __p0, int8x8_t __p1) {
  65487   int8x8_t __ret;
  65488   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65489   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65490   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65491   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65492   return __ret;
  65493 }
  65494 #endif
  65495 
  65496 #ifdef __LITTLE_ENDIAN__
  65497 __ai __attribute__((target("neon"))) float32x2_t vuzp1_f32(float32x2_t __p0, float32x2_t __p1) {
  65498   float32x2_t __ret;
  65499   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65500   return __ret;
  65501 }
  65502 #else
  65503 __ai __attribute__((target("neon"))) float32x2_t vuzp1_f32(float32x2_t __p0, float32x2_t __p1) {
  65504   float32x2_t __ret;
  65505   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65506   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65507   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65508   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65509   return __ret;
  65510 }
  65511 #endif
  65512 
  65513 #ifdef __LITTLE_ENDIAN__
  65514 __ai __attribute__((target("neon"))) int32x2_t vuzp1_s32(int32x2_t __p0, int32x2_t __p1) {
  65515   int32x2_t __ret;
  65516   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  65517   return __ret;
  65518 }
  65519 #else
  65520 __ai __attribute__((target("neon"))) int32x2_t vuzp1_s32(int32x2_t __p0, int32x2_t __p1) {
  65521   int32x2_t __ret;
  65522   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65523   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65524   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  65525   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65526   return __ret;
  65527 }
  65528 #endif
  65529 
  65530 #ifdef __LITTLE_ENDIAN__
  65531 __ai __attribute__((target("neon"))) int16x4_t vuzp1_s16(int16x4_t __p0, int16x4_t __p1) {
  65532   int16x4_t __ret;
  65533   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65534   return __ret;
  65535 }
  65536 #else
  65537 __ai __attribute__((target("neon"))) int16x4_t vuzp1_s16(int16x4_t __p0, int16x4_t __p1) {
  65538   int16x4_t __ret;
  65539   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65540   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65541   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65542   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65543   return __ret;
  65544 }
  65545 #endif
  65546 
  65547 #ifdef __LITTLE_ENDIAN__
  65548 __ai __attribute__((target("neon"))) float16x8_t vuzp1q_f16(float16x8_t __p0, float16x8_t __p1) {
  65549   float16x8_t __ret;
  65550   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14);
  65551   return __ret;
  65552 }
  65553 #else
  65554 __ai __attribute__((target("neon"))) float16x8_t vuzp1q_f16(float16x8_t __p0, float16x8_t __p1) {
  65555   float16x8_t __ret;
  65556   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65557   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65558   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14);
  65559   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65560   return __ret;
  65561 }
  65562 #endif
  65563 
  65564 #ifdef __LITTLE_ENDIAN__
  65565 __ai __attribute__((target("neon"))) float16x4_t vuzp1_f16(float16x4_t __p0, float16x4_t __p1) {
  65566   float16x4_t __ret;
  65567   __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6);
  65568   return __ret;
  65569 }
  65570 #else
  65571 __ai __attribute__((target("neon"))) float16x4_t vuzp1_f16(float16x4_t __p0, float16x4_t __p1) {
  65572   float16x4_t __ret;
  65573   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65574   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65575   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6);
  65576   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65577   return __ret;
  65578 }
  65579 #endif
  65580 
  65581 #ifdef __LITTLE_ENDIAN__
  65582 __ai __attribute__((target("neon"))) poly8x8_t vuzp2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65583   poly8x8_t __ret;
  65584   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65585   return __ret;
  65586 }
  65587 #else
  65588 __ai __attribute__((target("neon"))) poly8x8_t vuzp2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65589   poly8x8_t __ret;
  65590   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65591   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65592   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65593   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65594   return __ret;
  65595 }
  65596 #endif
  65597 
  65598 #ifdef __LITTLE_ENDIAN__
  65599 __ai __attribute__((target("neon"))) poly16x4_t vuzp2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  65600   poly16x4_t __ret;
  65601   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65602   return __ret;
  65603 }
  65604 #else
  65605 __ai __attribute__((target("neon"))) poly16x4_t vuzp2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  65606   poly16x4_t __ret;
  65607   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65608   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65609   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65610   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65611   return __ret;
  65612 }
  65613 #endif
  65614 
  65615 #ifdef __LITTLE_ENDIAN__
  65616 __ai __attribute__((target("neon"))) poly8x16_t vuzp2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  65617   poly8x16_t __ret;
  65618   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65619   return __ret;
  65620 }
  65621 #else
  65622 __ai __attribute__((target("neon"))) poly8x16_t vuzp2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  65623   poly8x16_t __ret;
  65624   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65625   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65626   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65627   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65628   return __ret;
  65629 }
  65630 #endif
  65631 
  65632 #ifdef __LITTLE_ENDIAN__
  65633 __ai __attribute__((target("neon"))) poly64x2_t vuzp2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  65634   poly64x2_t __ret;
  65635   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65636   return __ret;
  65637 }
  65638 #else
  65639 __ai __attribute__((target("neon"))) poly64x2_t vuzp2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  65640   poly64x2_t __ret;
  65641   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65642   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65643   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65644   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65645   return __ret;
  65646 }
  65647 #endif
  65648 
  65649 #ifdef __LITTLE_ENDIAN__
  65650 __ai __attribute__((target("neon"))) poly16x8_t vuzp2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  65651   poly16x8_t __ret;
  65652   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65653   return __ret;
  65654 }
  65655 #else
  65656 __ai __attribute__((target("neon"))) poly16x8_t vuzp2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  65657   poly16x8_t __ret;
  65658   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65659   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65660   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65661   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65662   return __ret;
  65663 }
  65664 #endif
  65665 
  65666 #ifdef __LITTLE_ENDIAN__
  65667 __ai __attribute__((target("neon"))) uint8x16_t vuzp2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  65668   uint8x16_t __ret;
  65669   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65670   return __ret;
  65671 }
  65672 #else
  65673 __ai __attribute__((target("neon"))) uint8x16_t vuzp2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  65674   uint8x16_t __ret;
  65675   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65676   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65677   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65678   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65679   return __ret;
  65680 }
  65681 #endif
  65682 
  65683 #ifdef __LITTLE_ENDIAN__
  65684 __ai __attribute__((target("neon"))) uint32x4_t vuzp2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  65685   uint32x4_t __ret;
  65686   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65687   return __ret;
  65688 }
  65689 #else
  65690 __ai __attribute__((target("neon"))) uint32x4_t vuzp2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  65691   uint32x4_t __ret;
  65692   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65693   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65694   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65695   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65696   return __ret;
  65697 }
  65698 #endif
  65699 
  65700 #ifdef __LITTLE_ENDIAN__
  65701 __ai __attribute__((target("neon"))) uint64x2_t vuzp2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  65702   uint64x2_t __ret;
  65703   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65704   return __ret;
  65705 }
  65706 #else
  65707 __ai __attribute__((target("neon"))) uint64x2_t vuzp2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  65708   uint64x2_t __ret;
  65709   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65710   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65711   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65712   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65713   return __ret;
  65714 }
  65715 #endif
  65716 
  65717 #ifdef __LITTLE_ENDIAN__
  65718 __ai __attribute__((target("neon"))) uint16x8_t vuzp2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  65719   uint16x8_t __ret;
  65720   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65721   return __ret;
  65722 }
  65723 #else
  65724 __ai __attribute__((target("neon"))) uint16x8_t vuzp2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  65725   uint16x8_t __ret;
  65726   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65727   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65728   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65729   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65730   return __ret;
  65731 }
  65732 #endif
  65733 
  65734 #ifdef __LITTLE_ENDIAN__
  65735 __ai __attribute__((target("neon"))) int8x16_t vuzp2q_s8(int8x16_t __p0, int8x16_t __p1) {
  65736   int8x16_t __ret;
  65737   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65738   return __ret;
  65739 }
  65740 #else
  65741 __ai __attribute__((target("neon"))) int8x16_t vuzp2q_s8(int8x16_t __p0, int8x16_t __p1) {
  65742   int8x16_t __ret;
  65743   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65744   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65745   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31);
  65746   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  65747   return __ret;
  65748 }
  65749 #endif
  65750 
  65751 #ifdef __LITTLE_ENDIAN__
  65752 __ai __attribute__((target("neon"))) float64x2_t vuzp2q_f64(float64x2_t __p0, float64x2_t __p1) {
  65753   float64x2_t __ret;
  65754   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65755   return __ret;
  65756 }
  65757 #else
  65758 __ai __attribute__((target("neon"))) float64x2_t vuzp2q_f64(float64x2_t __p0, float64x2_t __p1) {
  65759   float64x2_t __ret;
  65760   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65761   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65762   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65763   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65764   return __ret;
  65765 }
  65766 #endif
  65767 
  65768 #ifdef __LITTLE_ENDIAN__
  65769 __ai __attribute__((target("neon"))) float32x4_t vuzp2q_f32(float32x4_t __p0, float32x4_t __p1) {
  65770   float32x4_t __ret;
  65771   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65772   return __ret;
  65773 }
  65774 #else
  65775 __ai __attribute__((target("neon"))) float32x4_t vuzp2q_f32(float32x4_t __p0, float32x4_t __p1) {
  65776   float32x4_t __ret;
  65777   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65778   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65779   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65780   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65781   return __ret;
  65782 }
  65783 #endif
  65784 
  65785 #ifdef __LITTLE_ENDIAN__
  65786 __ai __attribute__((target("neon"))) int32x4_t vuzp2q_s32(int32x4_t __p0, int32x4_t __p1) {
  65787   int32x4_t __ret;
  65788   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65789   return __ret;
  65790 }
  65791 #else
  65792 __ai __attribute__((target("neon"))) int32x4_t vuzp2q_s32(int32x4_t __p0, int32x4_t __p1) {
  65793   int32x4_t __ret;
  65794   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65795   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65796   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65797   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65798   return __ret;
  65799 }
  65800 #endif
  65801 
  65802 #ifdef __LITTLE_ENDIAN__
  65803 __ai __attribute__((target("neon"))) int64x2_t vuzp2q_s64(int64x2_t __p0, int64x2_t __p1) {
  65804   int64x2_t __ret;
  65805   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65806   return __ret;
  65807 }
  65808 #else
  65809 __ai __attribute__((target("neon"))) int64x2_t vuzp2q_s64(int64x2_t __p0, int64x2_t __p1) {
  65810   int64x2_t __ret;
  65811   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65812   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65813   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65814   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65815   return __ret;
  65816 }
  65817 #endif
  65818 
  65819 #ifdef __LITTLE_ENDIAN__
  65820 __ai __attribute__((target("neon"))) int16x8_t vuzp2q_s16(int16x8_t __p0, int16x8_t __p1) {
  65821   int16x8_t __ret;
  65822   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65823   return __ret;
  65824 }
  65825 #else
  65826 __ai __attribute__((target("neon"))) int16x8_t vuzp2q_s16(int16x8_t __p0, int16x8_t __p1) {
  65827   int16x8_t __ret;
  65828   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65829   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65830   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65831   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65832   return __ret;
  65833 }
  65834 #endif
  65835 
  65836 #ifdef __LITTLE_ENDIAN__
  65837 __ai __attribute__((target("neon"))) uint8x8_t vuzp2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  65838   uint8x8_t __ret;
  65839   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65840   return __ret;
  65841 }
  65842 #else
  65843 __ai __attribute__((target("neon"))) uint8x8_t vuzp2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  65844   uint8x8_t __ret;
  65845   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65846   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65847   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65848   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65849   return __ret;
  65850 }
  65851 #endif
  65852 
  65853 #ifdef __LITTLE_ENDIAN__
  65854 __ai __attribute__((target("neon"))) uint32x2_t vuzp2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  65855   uint32x2_t __ret;
  65856   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65857   return __ret;
  65858 }
  65859 #else
  65860 __ai __attribute__((target("neon"))) uint32x2_t vuzp2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  65861   uint32x2_t __ret;
  65862   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65863   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65864   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65865   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65866   return __ret;
  65867 }
  65868 #endif
  65869 
  65870 #ifdef __LITTLE_ENDIAN__
  65871 __ai __attribute__((target("neon"))) uint16x4_t vuzp2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  65872   uint16x4_t __ret;
  65873   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65874   return __ret;
  65875 }
  65876 #else
  65877 __ai __attribute__((target("neon"))) uint16x4_t vuzp2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  65878   uint16x4_t __ret;
  65879   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65880   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65881   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65882   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65883   return __ret;
  65884 }
  65885 #endif
  65886 
  65887 #ifdef __LITTLE_ENDIAN__
  65888 __ai __attribute__((target("neon"))) int8x8_t vuzp2_s8(int8x8_t __p0, int8x8_t __p1) {
  65889   int8x8_t __ret;
  65890   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65891   return __ret;
  65892 }
  65893 #else
  65894 __ai __attribute__((target("neon"))) int8x8_t vuzp2_s8(int8x8_t __p0, int8x8_t __p1) {
  65895   int8x8_t __ret;
  65896   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65897   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65898   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65899   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65900   return __ret;
  65901 }
  65902 #endif
  65903 
  65904 #ifdef __LITTLE_ENDIAN__
  65905 __ai __attribute__((target("neon"))) float32x2_t vuzp2_f32(float32x2_t __p0, float32x2_t __p1) {
  65906   float32x2_t __ret;
  65907   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65908   return __ret;
  65909 }
  65910 #else
  65911 __ai __attribute__((target("neon"))) float32x2_t vuzp2_f32(float32x2_t __p0, float32x2_t __p1) {
  65912   float32x2_t __ret;
  65913   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65914   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65915   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65916   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65917   return __ret;
  65918 }
  65919 #endif
  65920 
  65921 #ifdef __LITTLE_ENDIAN__
  65922 __ai __attribute__((target("neon"))) int32x2_t vuzp2_s32(int32x2_t __p0, int32x2_t __p1) {
  65923   int32x2_t __ret;
  65924   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  65925   return __ret;
  65926 }
  65927 #else
  65928 __ai __attribute__((target("neon"))) int32x2_t vuzp2_s32(int32x2_t __p0, int32x2_t __p1) {
  65929   int32x2_t __ret;
  65930   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  65931   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  65932   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  65933   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  65934   return __ret;
  65935 }
  65936 #endif
  65937 
  65938 #ifdef __LITTLE_ENDIAN__
  65939 __ai __attribute__((target("neon"))) int16x4_t vuzp2_s16(int16x4_t __p0, int16x4_t __p1) {
  65940   int16x4_t __ret;
  65941   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65942   return __ret;
  65943 }
  65944 #else
  65945 __ai __attribute__((target("neon"))) int16x4_t vuzp2_s16(int16x4_t __p0, int16x4_t __p1) {
  65946   int16x4_t __ret;
  65947   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65948   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65949   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65950   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65951   return __ret;
  65952 }
  65953 #endif
  65954 
  65955 #ifdef __LITTLE_ENDIAN__
  65956 __ai __attribute__((target("neon"))) float16x8_t vuzp2q_f16(float16x8_t __p0, float16x8_t __p1) {
  65957   float16x8_t __ret;
  65958   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15);
  65959   return __ret;
  65960 }
  65961 #else
  65962 __ai __attribute__((target("neon"))) float16x8_t vuzp2q_f16(float16x8_t __p0, float16x8_t __p1) {
  65963   float16x8_t __ret;
  65964   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65965   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  65966   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15);
  65967   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  65968   return __ret;
  65969 }
  65970 #endif
  65971 
  65972 #ifdef __LITTLE_ENDIAN__
  65973 __ai __attribute__((target("neon"))) float16x4_t vuzp2_f16(float16x4_t __p0, float16x4_t __p1) {
  65974   float16x4_t __ret;
  65975   __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7);
  65976   return __ret;
  65977 }
  65978 #else
  65979 __ai __attribute__((target("neon"))) float16x4_t vuzp2_f16(float16x4_t __p0, float16x4_t __p1) {
  65980   float16x4_t __ret;
  65981   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  65982   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  65983   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7);
  65984   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  65985   return __ret;
  65986 }
  65987 #endif
  65988 
  65989 #ifdef __LITTLE_ENDIAN__
  65990 __ai __attribute__((target("neon"))) poly8x8_t vzip1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65991   poly8x8_t __ret;
  65992   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  65993   return __ret;
  65994 }
  65995 #else
  65996 __ai __attribute__((target("neon"))) poly8x8_t vzip1_p8(poly8x8_t __p0, poly8x8_t __p1) {
  65997   poly8x8_t __ret;
  65998   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  65999   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66000   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66001   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66002   return __ret;
  66003 }
  66004 #endif
  66005 
  66006 #ifdef __LITTLE_ENDIAN__
  66007 __ai __attribute__((target("neon"))) poly16x4_t vzip1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  66008   poly16x4_t __ret;
  66009   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66010   return __ret;
  66011 }
  66012 #else
  66013 __ai __attribute__((target("neon"))) poly16x4_t vzip1_p16(poly16x4_t __p0, poly16x4_t __p1) {
  66014   poly16x4_t __ret;
  66015   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66016   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66017   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66018   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66019   return __ret;
  66020 }
  66021 #endif
  66022 
  66023 #ifdef __LITTLE_ENDIAN__
  66024 __ai __attribute__((target("neon"))) poly8x16_t vzip1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  66025   poly8x16_t __ret;
  66026   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66027   return __ret;
  66028 }
  66029 #else
  66030 __ai __attribute__((target("neon"))) poly8x16_t vzip1q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  66031   poly8x16_t __ret;
  66032   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66033   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66034   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66035   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66036   return __ret;
  66037 }
  66038 #endif
  66039 
  66040 #ifdef __LITTLE_ENDIAN__
  66041 __ai __attribute__((target("neon"))) poly64x2_t vzip1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  66042   poly64x2_t __ret;
  66043   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66044   return __ret;
  66045 }
  66046 #else
  66047 __ai __attribute__((target("neon"))) poly64x2_t vzip1q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  66048   poly64x2_t __ret;
  66049   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66050   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66051   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66052   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66053   return __ret;
  66054 }
  66055 #endif
  66056 
  66057 #ifdef __LITTLE_ENDIAN__
  66058 __ai __attribute__((target("neon"))) poly16x8_t vzip1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  66059   poly16x8_t __ret;
  66060   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66061   return __ret;
  66062 }
  66063 #else
  66064 __ai __attribute__((target("neon"))) poly16x8_t vzip1q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  66065   poly16x8_t __ret;
  66066   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66067   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66068   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66069   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66070   return __ret;
  66071 }
  66072 #endif
  66073 
  66074 #ifdef __LITTLE_ENDIAN__
  66075 __ai __attribute__((target("neon"))) uint8x16_t vzip1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  66076   uint8x16_t __ret;
  66077   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66078   return __ret;
  66079 }
  66080 #else
  66081 __ai __attribute__((target("neon"))) uint8x16_t vzip1q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  66082   uint8x16_t __ret;
  66083   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66084   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66085   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66086   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66087   return __ret;
  66088 }
  66089 #endif
  66090 
  66091 #ifdef __LITTLE_ENDIAN__
  66092 __ai __attribute__((target("neon"))) uint32x4_t vzip1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  66093   uint32x4_t __ret;
  66094   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66095   return __ret;
  66096 }
  66097 #else
  66098 __ai __attribute__((target("neon"))) uint32x4_t vzip1q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  66099   uint32x4_t __ret;
  66100   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66101   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66102   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66103   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66104   return __ret;
  66105 }
  66106 #endif
  66107 
  66108 #ifdef __LITTLE_ENDIAN__
  66109 __ai __attribute__((target("neon"))) uint64x2_t vzip1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  66110   uint64x2_t __ret;
  66111   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66112   return __ret;
  66113 }
  66114 #else
  66115 __ai __attribute__((target("neon"))) uint64x2_t vzip1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  66116   uint64x2_t __ret;
  66117   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66118   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66119   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66120   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66121   return __ret;
  66122 }
  66123 #endif
  66124 
  66125 #ifdef __LITTLE_ENDIAN__
  66126 __ai __attribute__((target("neon"))) uint16x8_t vzip1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  66127   uint16x8_t __ret;
  66128   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66129   return __ret;
  66130 }
  66131 #else
  66132 __ai __attribute__((target("neon"))) uint16x8_t vzip1q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  66133   uint16x8_t __ret;
  66134   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66135   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66136   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66137   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66138   return __ret;
  66139 }
  66140 #endif
  66141 
  66142 #ifdef __LITTLE_ENDIAN__
  66143 __ai __attribute__((target("neon"))) int8x16_t vzip1q_s8(int8x16_t __p0, int8x16_t __p1) {
  66144   int8x16_t __ret;
  66145   __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66146   return __ret;
  66147 }
  66148 #else
  66149 __ai __attribute__((target("neon"))) int8x16_t vzip1q_s8(int8x16_t __p0, int8x16_t __p1) {
  66150   int8x16_t __ret;
  66151   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66152   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66153   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23);
  66154   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66155   return __ret;
  66156 }
  66157 #endif
  66158 
  66159 #ifdef __LITTLE_ENDIAN__
  66160 __ai __attribute__((target("neon"))) float64x2_t vzip1q_f64(float64x2_t __p0, float64x2_t __p1) {
  66161   float64x2_t __ret;
  66162   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66163   return __ret;
  66164 }
  66165 #else
  66166 __ai __attribute__((target("neon"))) float64x2_t vzip1q_f64(float64x2_t __p0, float64x2_t __p1) {
  66167   float64x2_t __ret;
  66168   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66169   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66170   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66171   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66172   return __ret;
  66173 }
  66174 #endif
  66175 
  66176 #ifdef __LITTLE_ENDIAN__
  66177 __ai __attribute__((target("neon"))) float32x4_t vzip1q_f32(float32x4_t __p0, float32x4_t __p1) {
  66178   float32x4_t __ret;
  66179   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66180   return __ret;
  66181 }
  66182 #else
  66183 __ai __attribute__((target("neon"))) float32x4_t vzip1q_f32(float32x4_t __p0, float32x4_t __p1) {
  66184   float32x4_t __ret;
  66185   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66186   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66187   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66188   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66189   return __ret;
  66190 }
  66191 #endif
  66192 
  66193 #ifdef __LITTLE_ENDIAN__
  66194 __ai __attribute__((target("neon"))) int32x4_t vzip1q_s32(int32x4_t __p0, int32x4_t __p1) {
  66195   int32x4_t __ret;
  66196   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66197   return __ret;
  66198 }
  66199 #else
  66200 __ai __attribute__((target("neon"))) int32x4_t vzip1q_s32(int32x4_t __p0, int32x4_t __p1) {
  66201   int32x4_t __ret;
  66202   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66203   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66204   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66205   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66206   return __ret;
  66207 }
  66208 #endif
  66209 
  66210 #ifdef __LITTLE_ENDIAN__
  66211 __ai __attribute__((target("neon"))) int64x2_t vzip1q_s64(int64x2_t __p0, int64x2_t __p1) {
  66212   int64x2_t __ret;
  66213   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66214   return __ret;
  66215 }
  66216 #else
  66217 __ai __attribute__((target("neon"))) int64x2_t vzip1q_s64(int64x2_t __p0, int64x2_t __p1) {
  66218   int64x2_t __ret;
  66219   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66220   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66221   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66222   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66223   return __ret;
  66224 }
  66225 #endif
  66226 
  66227 #ifdef __LITTLE_ENDIAN__
  66228 __ai __attribute__((target("neon"))) int16x8_t vzip1q_s16(int16x8_t __p0, int16x8_t __p1) {
  66229   int16x8_t __ret;
  66230   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66231   return __ret;
  66232 }
  66233 #else
  66234 __ai __attribute__((target("neon"))) int16x8_t vzip1q_s16(int16x8_t __p0, int16x8_t __p1) {
  66235   int16x8_t __ret;
  66236   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66237   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66238   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66239   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66240   return __ret;
  66241 }
  66242 #endif
  66243 
  66244 #ifdef __LITTLE_ENDIAN__
  66245 __ai __attribute__((target("neon"))) uint8x8_t vzip1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  66246   uint8x8_t __ret;
  66247   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66248   return __ret;
  66249 }
  66250 #else
  66251 __ai __attribute__((target("neon"))) uint8x8_t vzip1_u8(uint8x8_t __p0, uint8x8_t __p1) {
  66252   uint8x8_t __ret;
  66253   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66254   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66255   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66256   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66257   return __ret;
  66258 }
  66259 #endif
  66260 
  66261 #ifdef __LITTLE_ENDIAN__
  66262 __ai __attribute__((target("neon"))) uint32x2_t vzip1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  66263   uint32x2_t __ret;
  66264   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66265   return __ret;
  66266 }
  66267 #else
  66268 __ai __attribute__((target("neon"))) uint32x2_t vzip1_u32(uint32x2_t __p0, uint32x2_t __p1) {
  66269   uint32x2_t __ret;
  66270   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66271   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66272   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66273   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66274   return __ret;
  66275 }
  66276 #endif
  66277 
  66278 #ifdef __LITTLE_ENDIAN__
  66279 __ai __attribute__((target("neon"))) uint16x4_t vzip1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  66280   uint16x4_t __ret;
  66281   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66282   return __ret;
  66283 }
  66284 #else
  66285 __ai __attribute__((target("neon"))) uint16x4_t vzip1_u16(uint16x4_t __p0, uint16x4_t __p1) {
  66286   uint16x4_t __ret;
  66287   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66288   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66289   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66290   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66291   return __ret;
  66292 }
  66293 #endif
  66294 
  66295 #ifdef __LITTLE_ENDIAN__
  66296 __ai __attribute__((target("neon"))) int8x8_t vzip1_s8(int8x8_t __p0, int8x8_t __p1) {
  66297   int8x8_t __ret;
  66298   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66299   return __ret;
  66300 }
  66301 #else
  66302 __ai __attribute__((target("neon"))) int8x8_t vzip1_s8(int8x8_t __p0, int8x8_t __p1) {
  66303   int8x8_t __ret;
  66304   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66305   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66306   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66307   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66308   return __ret;
  66309 }
  66310 #endif
  66311 
  66312 #ifdef __LITTLE_ENDIAN__
  66313 __ai __attribute__((target("neon"))) float32x2_t vzip1_f32(float32x2_t __p0, float32x2_t __p1) {
  66314   float32x2_t __ret;
  66315   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66316   return __ret;
  66317 }
  66318 #else
  66319 __ai __attribute__((target("neon"))) float32x2_t vzip1_f32(float32x2_t __p0, float32x2_t __p1) {
  66320   float32x2_t __ret;
  66321   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66322   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66323   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66324   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66325   return __ret;
  66326 }
  66327 #endif
  66328 
  66329 #ifdef __LITTLE_ENDIAN__
  66330 __ai __attribute__((target("neon"))) int32x2_t vzip1_s32(int32x2_t __p0, int32x2_t __p1) {
  66331   int32x2_t __ret;
  66332   __ret = __builtin_shufflevector(__p0, __p1, 0, 2);
  66333   return __ret;
  66334 }
  66335 #else
  66336 __ai __attribute__((target("neon"))) int32x2_t vzip1_s32(int32x2_t __p0, int32x2_t __p1) {
  66337   int32x2_t __ret;
  66338   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66339   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66340   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2);
  66341   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66342   return __ret;
  66343 }
  66344 #endif
  66345 
  66346 #ifdef __LITTLE_ENDIAN__
  66347 __ai __attribute__((target("neon"))) int16x4_t vzip1_s16(int16x4_t __p0, int16x4_t __p1) {
  66348   int16x4_t __ret;
  66349   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66350   return __ret;
  66351 }
  66352 #else
  66353 __ai __attribute__((target("neon"))) int16x4_t vzip1_s16(int16x4_t __p0, int16x4_t __p1) {
  66354   int16x4_t __ret;
  66355   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66356   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66357   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66358   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66359   return __ret;
  66360 }
  66361 #endif
  66362 
  66363 #ifdef __LITTLE_ENDIAN__
  66364 __ai __attribute__((target("neon"))) float16x8_t vzip1q_f16(float16x8_t __p0, float16x8_t __p1) {
  66365   float16x8_t __ret;
  66366   __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11);
  66367   return __ret;
  66368 }
  66369 #else
  66370 __ai __attribute__((target("neon"))) float16x8_t vzip1q_f16(float16x8_t __p0, float16x8_t __p1) {
  66371   float16x8_t __ret;
  66372   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66373   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66374   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11);
  66375   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66376   return __ret;
  66377 }
  66378 #endif
  66379 
  66380 #ifdef __LITTLE_ENDIAN__
  66381 __ai __attribute__((target("neon"))) float16x4_t vzip1_f16(float16x4_t __p0, float16x4_t __p1) {
  66382   float16x4_t __ret;
  66383   __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5);
  66384   return __ret;
  66385 }
  66386 #else
  66387 __ai __attribute__((target("neon"))) float16x4_t vzip1_f16(float16x4_t __p0, float16x4_t __p1) {
  66388   float16x4_t __ret;
  66389   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66390   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66391   __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5);
  66392   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66393   return __ret;
  66394 }
  66395 #endif
  66396 
  66397 #ifdef __LITTLE_ENDIAN__
  66398 __ai __attribute__((target("neon"))) poly8x8_t vzip2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  66399   poly8x8_t __ret;
  66400   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66401   return __ret;
  66402 }
  66403 #else
  66404 __ai __attribute__((target("neon"))) poly8x8_t vzip2_p8(poly8x8_t __p0, poly8x8_t __p1) {
  66405   poly8x8_t __ret;
  66406   poly8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66407   poly8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66408   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66409   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66410   return __ret;
  66411 }
  66412 #endif
  66413 
  66414 #ifdef __LITTLE_ENDIAN__
  66415 __ai __attribute__((target("neon"))) poly16x4_t vzip2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  66416   poly16x4_t __ret;
  66417   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66418   return __ret;
  66419 }
  66420 #else
  66421 __ai __attribute__((target("neon"))) poly16x4_t vzip2_p16(poly16x4_t __p0, poly16x4_t __p1) {
  66422   poly16x4_t __ret;
  66423   poly16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66424   poly16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66425   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66426   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66427   return __ret;
  66428 }
  66429 #endif
  66430 
  66431 #ifdef __LITTLE_ENDIAN__
  66432 __ai __attribute__((target("neon"))) poly8x16_t vzip2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  66433   poly8x16_t __ret;
  66434   __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66435   return __ret;
  66436 }
  66437 #else
  66438 __ai __attribute__((target("neon"))) poly8x16_t vzip2q_p8(poly8x16_t __p0, poly8x16_t __p1) {
  66439   poly8x16_t __ret;
  66440   poly8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66441   poly8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66442   __ret = __builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66443   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66444   return __ret;
  66445 }
  66446 #endif
  66447 
  66448 #ifdef __LITTLE_ENDIAN__
  66449 __ai __attribute__((target("neon"))) poly64x2_t vzip2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  66450   poly64x2_t __ret;
  66451   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66452   return __ret;
  66453 }
  66454 #else
  66455 __ai __attribute__((target("neon"))) poly64x2_t vzip2q_p64(poly64x2_t __p0, poly64x2_t __p1) {
  66456   poly64x2_t __ret;
  66457   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66458   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66459   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66460   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66461   return __ret;
  66462 }
  66463 #endif
  66464 
  66465 #ifdef __LITTLE_ENDIAN__
  66466 __ai __attribute__((target("neon"))) poly16x8_t vzip2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  66467   poly16x8_t __ret;
  66468   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66469   return __ret;
  66470 }
  66471 #else
  66472 __ai __attribute__((target("neon"))) poly16x8_t vzip2q_p16(poly16x8_t __p0, poly16x8_t __p1) {
  66473   poly16x8_t __ret;
  66474   poly16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66475   poly16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66476   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66477   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66478   return __ret;
  66479 }
  66480 #endif
  66481 
  66482 #ifdef __LITTLE_ENDIAN__
  66483 __ai __attribute__((target("neon"))) uint8x16_t vzip2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  66484   uint8x16_t __ret;
  66485   __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66486   return __ret;
  66487 }
  66488 #else
  66489 __ai __attribute__((target("neon"))) uint8x16_t vzip2q_u8(uint8x16_t __p0, uint8x16_t __p1) {
  66490   uint8x16_t __ret;
  66491   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66492   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66493   __ret = __builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66494   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66495   return __ret;
  66496 }
  66497 #endif
  66498 
  66499 #ifdef __LITTLE_ENDIAN__
  66500 __ai __attribute__((target("neon"))) uint32x4_t vzip2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  66501   uint32x4_t __ret;
  66502   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66503   return __ret;
  66504 }
  66505 #else
  66506 __ai __attribute__((target("neon"))) uint32x4_t vzip2q_u32(uint32x4_t __p0, uint32x4_t __p1) {
  66507   uint32x4_t __ret;
  66508   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66509   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66510   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66511   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66512   return __ret;
  66513 }
  66514 #endif
  66515 
  66516 #ifdef __LITTLE_ENDIAN__
  66517 __ai __attribute__((target("neon"))) uint64x2_t vzip2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  66518   uint64x2_t __ret;
  66519   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66520   return __ret;
  66521 }
  66522 #else
  66523 __ai __attribute__((target("neon"))) uint64x2_t vzip2q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  66524   uint64x2_t __ret;
  66525   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66526   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66527   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66528   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66529   return __ret;
  66530 }
  66531 #endif
  66532 
  66533 #ifdef __LITTLE_ENDIAN__
  66534 __ai __attribute__((target("neon"))) uint16x8_t vzip2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  66535   uint16x8_t __ret;
  66536   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66537   return __ret;
  66538 }
  66539 #else
  66540 __ai __attribute__((target("neon"))) uint16x8_t vzip2q_u16(uint16x8_t __p0, uint16x8_t __p1) {
  66541   uint16x8_t __ret;
  66542   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66543   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66544   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66545   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66546   return __ret;
  66547 }
  66548 #endif
  66549 
  66550 #ifdef __LITTLE_ENDIAN__
  66551 __ai __attribute__((target("neon"))) int8x16_t vzip2q_s8(int8x16_t __p0, int8x16_t __p1) {
  66552   int8x16_t __ret;
  66553   __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66554   return __ret;
  66555 }
  66556 #else
  66557 __ai __attribute__((target("neon"))) int8x16_t vzip2q_s8(int8x16_t __p0, int8x16_t __p1) {
  66558   int8x16_t __ret;
  66559   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66560   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66561   __ret = __builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31);
  66562   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66563   return __ret;
  66564 }
  66565 #endif
  66566 
  66567 #ifdef __LITTLE_ENDIAN__
  66568 __ai __attribute__((target("neon"))) float64x2_t vzip2q_f64(float64x2_t __p0, float64x2_t __p1) {
  66569   float64x2_t __ret;
  66570   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66571   return __ret;
  66572 }
  66573 #else
  66574 __ai __attribute__((target("neon"))) float64x2_t vzip2q_f64(float64x2_t __p0, float64x2_t __p1) {
  66575   float64x2_t __ret;
  66576   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66577   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66578   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66579   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66580   return __ret;
  66581 }
  66582 #endif
  66583 
  66584 #ifdef __LITTLE_ENDIAN__
  66585 __ai __attribute__((target("neon"))) float32x4_t vzip2q_f32(float32x4_t __p0, float32x4_t __p1) {
  66586   float32x4_t __ret;
  66587   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66588   return __ret;
  66589 }
  66590 #else
  66591 __ai __attribute__((target("neon"))) float32x4_t vzip2q_f32(float32x4_t __p0, float32x4_t __p1) {
  66592   float32x4_t __ret;
  66593   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66594   float32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66595   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66596   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66597   return __ret;
  66598 }
  66599 #endif
  66600 
  66601 #ifdef __LITTLE_ENDIAN__
  66602 __ai __attribute__((target("neon"))) int32x4_t vzip2q_s32(int32x4_t __p0, int32x4_t __p1) {
  66603   int32x4_t __ret;
  66604   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66605   return __ret;
  66606 }
  66607 #else
  66608 __ai __attribute__((target("neon"))) int32x4_t vzip2q_s32(int32x4_t __p0, int32x4_t __p1) {
  66609   int32x4_t __ret;
  66610   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66611   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66612   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66613   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66614   return __ret;
  66615 }
  66616 #endif
  66617 
  66618 #ifdef __LITTLE_ENDIAN__
  66619 __ai __attribute__((target("neon"))) int64x2_t vzip2q_s64(int64x2_t __p0, int64x2_t __p1) {
  66620   int64x2_t __ret;
  66621   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66622   return __ret;
  66623 }
  66624 #else
  66625 __ai __attribute__((target("neon"))) int64x2_t vzip2q_s64(int64x2_t __p0, int64x2_t __p1) {
  66626   int64x2_t __ret;
  66627   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66628   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66629   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66630   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66631   return __ret;
  66632 }
  66633 #endif
  66634 
  66635 #ifdef __LITTLE_ENDIAN__
  66636 __ai __attribute__((target("neon"))) int16x8_t vzip2q_s16(int16x8_t __p0, int16x8_t __p1) {
  66637   int16x8_t __ret;
  66638   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66639   return __ret;
  66640 }
  66641 #else
  66642 __ai __attribute__((target("neon"))) int16x8_t vzip2q_s16(int16x8_t __p0, int16x8_t __p1) {
  66643   int16x8_t __ret;
  66644   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66645   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66646   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66647   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66648   return __ret;
  66649 }
  66650 #endif
  66651 
  66652 #ifdef __LITTLE_ENDIAN__
  66653 __ai __attribute__((target("neon"))) uint8x8_t vzip2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  66654   uint8x8_t __ret;
  66655   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66656   return __ret;
  66657 }
  66658 #else
  66659 __ai __attribute__((target("neon"))) uint8x8_t vzip2_u8(uint8x8_t __p0, uint8x8_t __p1) {
  66660   uint8x8_t __ret;
  66661   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66662   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66663   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66664   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66665   return __ret;
  66666 }
  66667 #endif
  66668 
  66669 #ifdef __LITTLE_ENDIAN__
  66670 __ai __attribute__((target("neon"))) uint32x2_t vzip2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  66671   uint32x2_t __ret;
  66672   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66673   return __ret;
  66674 }
  66675 #else
  66676 __ai __attribute__((target("neon"))) uint32x2_t vzip2_u32(uint32x2_t __p0, uint32x2_t __p1) {
  66677   uint32x2_t __ret;
  66678   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66679   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66680   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66681   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66682   return __ret;
  66683 }
  66684 #endif
  66685 
  66686 #ifdef __LITTLE_ENDIAN__
  66687 __ai __attribute__((target("neon"))) uint16x4_t vzip2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  66688   uint16x4_t __ret;
  66689   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66690   return __ret;
  66691 }
  66692 #else
  66693 __ai __attribute__((target("neon"))) uint16x4_t vzip2_u16(uint16x4_t __p0, uint16x4_t __p1) {
  66694   uint16x4_t __ret;
  66695   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66696   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66697   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66698   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66699   return __ret;
  66700 }
  66701 #endif
  66702 
  66703 #ifdef __LITTLE_ENDIAN__
  66704 __ai __attribute__((target("neon"))) int8x8_t vzip2_s8(int8x8_t __p0, int8x8_t __p1) {
  66705   int8x8_t __ret;
  66706   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66707   return __ret;
  66708 }
  66709 #else
  66710 __ai __attribute__((target("neon"))) int8x8_t vzip2_s8(int8x8_t __p0, int8x8_t __p1) {
  66711   int8x8_t __ret;
  66712   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66713   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66714   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66715   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66716   return __ret;
  66717 }
  66718 #endif
  66719 
  66720 #ifdef __LITTLE_ENDIAN__
  66721 __ai __attribute__((target("neon"))) float32x2_t vzip2_f32(float32x2_t __p0, float32x2_t __p1) {
  66722   float32x2_t __ret;
  66723   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66724   return __ret;
  66725 }
  66726 #else
  66727 __ai __attribute__((target("neon"))) float32x2_t vzip2_f32(float32x2_t __p0, float32x2_t __p1) {
  66728   float32x2_t __ret;
  66729   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66730   float32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66731   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66732   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66733   return __ret;
  66734 }
  66735 #endif
  66736 
  66737 #ifdef __LITTLE_ENDIAN__
  66738 __ai __attribute__((target("neon"))) int32x2_t vzip2_s32(int32x2_t __p0, int32x2_t __p1) {
  66739   int32x2_t __ret;
  66740   __ret = __builtin_shufflevector(__p0, __p1, 1, 3);
  66741   return __ret;
  66742 }
  66743 #else
  66744 __ai __attribute__((target("neon"))) int32x2_t vzip2_s32(int32x2_t __p0, int32x2_t __p1) {
  66745   int32x2_t __ret;
  66746   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  66747   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  66748   __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3);
  66749   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  66750   return __ret;
  66751 }
  66752 #endif
  66753 
  66754 #ifdef __LITTLE_ENDIAN__
  66755 __ai __attribute__((target("neon"))) int16x4_t vzip2_s16(int16x4_t __p0, int16x4_t __p1) {
  66756   int16x4_t __ret;
  66757   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66758   return __ret;
  66759 }
  66760 #else
  66761 __ai __attribute__((target("neon"))) int16x4_t vzip2_s16(int16x4_t __p0, int16x4_t __p1) {
  66762   int16x4_t __ret;
  66763   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66764   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66765   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66766   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66767   return __ret;
  66768 }
  66769 #endif
  66770 
  66771 #ifdef __LITTLE_ENDIAN__
  66772 __ai __attribute__((target("neon"))) float16x8_t vzip2q_f16(float16x8_t __p0, float16x8_t __p1) {
  66773   float16x8_t __ret;
  66774   __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15);
  66775   return __ret;
  66776 }
  66777 #else
  66778 __ai __attribute__((target("neon"))) float16x8_t vzip2q_f16(float16x8_t __p0, float16x8_t __p1) {
  66779   float16x8_t __ret;
  66780   float16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  66781   float16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  66782   __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15);
  66783   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  66784   return __ret;
  66785 }
  66786 #endif
  66787 
  66788 #ifdef __LITTLE_ENDIAN__
  66789 __ai __attribute__((target("neon"))) float16x4_t vzip2_f16(float16x4_t __p0, float16x4_t __p1) {
  66790   float16x4_t __ret;
  66791   __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7);
  66792   return __ret;
  66793 }
  66794 #else
  66795 __ai __attribute__((target("neon"))) float16x4_t vzip2_f16(float16x4_t __p0, float16x4_t __p1) {
  66796   float16x4_t __ret;
  66797   float16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66798   float16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66799   __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7);
  66800   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  66801   return __ret;
  66802 }
  66803 #endif
  66804 
  66805 #define vldap1_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66806   poly64x1_t __ret; \
  66807   poly64x1_t __s1 = __p1; \
  66808   __ret = (poly64x1_t) __builtin_neon_vldap1_lane_p64(__p0, (int8x8_t)__s1, __p2, 6); \
  66809   __ret; \
  66810 })
  66811 #ifdef __LITTLE_ENDIAN__
  66812 #define vldap1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66813   poly64x2_t __ret; \
  66814   poly64x2_t __s1 = __p1; \
  66815   __ret = (poly64x2_t) __builtin_neon_vldap1q_lane_p64(__p0, (int8x16_t)__s1, __p2, 38); \
  66816   __ret; \
  66817 })
  66818 #else
  66819 #define vldap1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66820   poly64x2_t __ret; \
  66821   poly64x2_t __s1 = __p1; \
  66822   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66823   __ret = (poly64x2_t) __builtin_neon_vldap1q_lane_p64(__p0, (int8x16_t)__rev1, __p2, 38); \
  66824   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  66825   __ret; \
  66826 })
  66827 #endif
  66828 
  66829 #ifdef __LITTLE_ENDIAN__
  66830 #define vldap1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66831   uint64x2_t __ret; \
  66832   uint64x2_t __s1 = __p1; \
  66833   __ret = (uint64x2_t) __builtin_neon_vldap1q_lane_u64(__p0, (int8x16_t)__s1, __p2, 51); \
  66834   __ret; \
  66835 })
  66836 #else
  66837 #define vldap1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66838   uint64x2_t __ret; \
  66839   uint64x2_t __s1 = __p1; \
  66840   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66841   __ret = (uint64x2_t) __builtin_neon_vldap1q_lane_u64(__p0, (int8x16_t)__rev1, __p2, 51); \
  66842   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  66843   __ret; \
  66844 })
  66845 #endif
  66846 
  66847 #ifdef __LITTLE_ENDIAN__
  66848 #define vldap1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66849   float64x2_t __ret; \
  66850   float64x2_t __s1 = __p1; \
  66851   __ret = (float64x2_t) __builtin_neon_vldap1q_lane_f64(__p0, (int8x16_t)__s1, __p2, 42); \
  66852   __ret; \
  66853 })
  66854 #else
  66855 #define vldap1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66856   float64x2_t __ret; \
  66857   float64x2_t __s1 = __p1; \
  66858   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66859   __ret = (float64x2_t) __builtin_neon_vldap1q_lane_f64(__p0, (int8x16_t)__rev1, __p2, 42); \
  66860   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  66861   __ret; \
  66862 })
  66863 #endif
  66864 
  66865 #ifdef __LITTLE_ENDIAN__
  66866 #define vldap1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66867   int64x2_t __ret; \
  66868   int64x2_t __s1 = __p1; \
  66869   __ret = (int64x2_t) __builtin_neon_vldap1q_lane_s64(__p0, (int8x16_t)__s1, __p2, 35); \
  66870   __ret; \
  66871 })
  66872 #else
  66873 #define vldap1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66874   int64x2_t __ret; \
  66875   int64x2_t __s1 = __p1; \
  66876   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66877   __ret = (int64x2_t) __builtin_neon_vldap1q_lane_s64(__p0, (int8x16_t)__rev1, __p2, 35); \
  66878   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  66879   __ret; \
  66880 })
  66881 #endif
  66882 
  66883 #define vldap1_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66884   uint64x1_t __ret; \
  66885   uint64x1_t __s1 = __p1; \
  66886   __ret = (uint64x1_t) __builtin_neon_vldap1_lane_u64(__p0, (int8x8_t)__s1, __p2, 19); \
  66887   __ret; \
  66888 })
  66889 #define vldap1_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66890   float64x1_t __ret; \
  66891   float64x1_t __s1 = __p1; \
  66892   __ret = (float64x1_t) __builtin_neon_vldap1_lane_f64(__p0, (int8x8_t)__s1, __p2, 10); \
  66893   __ret; \
  66894 })
  66895 #define vldap1_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66896   int64x1_t __ret; \
  66897   int64x1_t __s1 = __p1; \
  66898   __ret = (int64x1_t) __builtin_neon_vldap1_lane_s64(__p0, (int8x8_t)__s1, __p2, 3); \
  66899   __ret; \
  66900 })
  66901 #define vstl1_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66902   poly64x1_t __s1 = __p1; \
  66903   __builtin_neon_vstl1_lane_p64(__p0, (int8x8_t)__s1, __p2, 6); \
  66904 })
  66905 #ifdef __LITTLE_ENDIAN__
  66906 #define vstl1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66907   poly64x2_t __s1 = __p1; \
  66908   __builtin_neon_vstl1q_lane_p64(__p0, (int8x16_t)__s1, __p2, 38); \
  66909 })
  66910 #else
  66911 #define vstl1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  66912   poly64x2_t __s1 = __p1; \
  66913   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66914   __builtin_neon_vstl1q_lane_p64(__p0, (int8x16_t)__rev1, __p2, 38); \
  66915 })
  66916 #endif
  66917 
  66918 #ifdef __LITTLE_ENDIAN__
  66919 #define vstl1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66920   uint64x2_t __s1 = __p1; \
  66921   __builtin_neon_vstl1q_lane_u64(__p0, (int8x16_t)__s1, __p2, 51); \
  66922 })
  66923 #else
  66924 #define vstl1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66925   uint64x2_t __s1 = __p1; \
  66926   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66927   __builtin_neon_vstl1q_lane_u64(__p0, (int8x16_t)__rev1, __p2, 51); \
  66928 })
  66929 #endif
  66930 
  66931 #ifdef __LITTLE_ENDIAN__
  66932 #define vstl1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66933   float64x2_t __s1 = __p1; \
  66934   __builtin_neon_vstl1q_lane_f64(__p0, (int8x16_t)__s1, __p2, 42); \
  66935 })
  66936 #else
  66937 #define vstl1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66938   float64x2_t __s1 = __p1; \
  66939   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66940   __builtin_neon_vstl1q_lane_f64(__p0, (int8x16_t)__rev1, __p2, 42); \
  66941 })
  66942 #endif
  66943 
  66944 #ifdef __LITTLE_ENDIAN__
  66945 #define vstl1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66946   int64x2_t __s1 = __p1; \
  66947   __builtin_neon_vstl1q_lane_s64(__p0, (int8x16_t)__s1, __p2, 35); \
  66948 })
  66949 #else
  66950 #define vstl1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66951   int64x2_t __s1 = __p1; \
  66952   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  66953   __builtin_neon_vstl1q_lane_s64(__p0, (int8x16_t)__rev1, __p2, 35); \
  66954 })
  66955 #endif
  66956 
  66957 #define vstl1_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  66958   uint64x1_t __s1 = __p1; \
  66959   __builtin_neon_vstl1_lane_u64(__p0, (int8x8_t)__s1, __p2, 19); \
  66960 })
  66961 #define vstl1_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  66962   float64x1_t __s1 = __p1; \
  66963   __builtin_neon_vstl1_lane_f64(__p0, (int8x8_t)__s1, __p2, 10); \
  66964 })
  66965 #define vstl1_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  66966   int64x1_t __s1 = __p1; \
  66967   __builtin_neon_vstl1_lane_s64(__p0, (int8x8_t)__s1, __p2, 3); \
  66968 })
  66969 #ifdef __LITTLE_ENDIAN__
  66970 __ai __attribute__((target("sha3,neon"))) uint8x16_t vbcaxq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  66971   uint8x16_t __ret;
  66972   __ret = (uint8x16_t) __builtin_neon_vbcaxq_u8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48);
  66973   return __ret;
  66974 }
  66975 #else
  66976 __ai __attribute__((target("sha3,neon"))) uint8x16_t vbcaxq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  66977   uint8x16_t __ret;
  66978   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66979   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66980   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66981   __ret = (uint8x16_t) __builtin_neon_vbcaxq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48);
  66982   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  66983   return __ret;
  66984 }
  66985 #endif
  66986 
  66987 #ifdef __LITTLE_ENDIAN__
  66988 __ai __attribute__((target("sha3,neon"))) uint32x4_t vbcaxq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  66989   uint32x4_t __ret;
  66990   __ret = (uint32x4_t) __builtin_neon_vbcaxq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  66991   return __ret;
  66992 }
  66993 #else
  66994 __ai __attribute__((target("sha3,neon"))) uint32x4_t vbcaxq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  66995   uint32x4_t __ret;
  66996   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  66997   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  66998   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  66999   __ret = (uint32x4_t) __builtin_neon_vbcaxq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  67000   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67001   return __ret;
  67002 }
  67003 #endif
  67004 
  67005 #ifdef __LITTLE_ENDIAN__
  67006 __ai __attribute__((target("sha3,neon"))) uint64x2_t vbcaxq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67007   uint64x2_t __ret;
  67008   __ret = (uint64x2_t) __builtin_neon_vbcaxq_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
  67009   return __ret;
  67010 }
  67011 #else
  67012 __ai __attribute__((target("sha3,neon"))) uint64x2_t vbcaxq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67013   uint64x2_t __ret;
  67014   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67015   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67016   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67017   __ret = (uint64x2_t) __builtin_neon_vbcaxq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
  67018   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67019   return __ret;
  67020 }
  67021 #endif
  67022 
  67023 #ifdef __LITTLE_ENDIAN__
  67024 __ai __attribute__((target("sha3,neon"))) uint16x8_t vbcaxq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  67025   uint16x8_t __ret;
  67026   __ret = (uint16x8_t) __builtin_neon_vbcaxq_u16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49);
  67027   return __ret;
  67028 }
  67029 #else
  67030 __ai __attribute__((target("sha3,neon"))) uint16x8_t vbcaxq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  67031   uint16x8_t __ret;
  67032   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  67033   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  67034   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  67035   __ret = (uint16x8_t) __builtin_neon_vbcaxq_u16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49);
  67036   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  67037   return __ret;
  67038 }
  67039 #endif
  67040 
  67041 #ifdef __LITTLE_ENDIAN__
  67042 __ai __attribute__((target("sha3,neon"))) int8x16_t vbcaxq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  67043   int8x16_t __ret;
  67044   __ret = (int8x16_t) __builtin_neon_vbcaxq_s8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32);
  67045   return __ret;
  67046 }
  67047 #else
  67048 __ai __attribute__((target("sha3,neon"))) int8x16_t vbcaxq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  67049   int8x16_t __ret;
  67050   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67051   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67052   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67053   __ret = (int8x16_t) __builtin_neon_vbcaxq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32);
  67054   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67055   return __ret;
  67056 }
  67057 #endif
  67058 
  67059 #ifdef __LITTLE_ENDIAN__
  67060 __ai __attribute__((target("sha3,neon"))) int32x4_t vbcaxq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  67061   int32x4_t __ret;
  67062   __ret = (int32x4_t) __builtin_neon_vbcaxq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  67063   return __ret;
  67064 }
  67065 #else
  67066 __ai __attribute__((target("sha3,neon"))) int32x4_t vbcaxq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  67067   int32x4_t __ret;
  67068   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67069   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67070   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67071   __ret = (int32x4_t) __builtin_neon_vbcaxq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
  67072   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67073   return __ret;
  67074 }
  67075 #endif
  67076 
  67077 #ifdef __LITTLE_ENDIAN__
  67078 __ai __attribute__((target("sha3,neon"))) int64x2_t vbcaxq_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  67079   int64x2_t __ret;
  67080   __ret = (int64x2_t) __builtin_neon_vbcaxq_s64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35);
  67081   return __ret;
  67082 }
  67083 #else
  67084 __ai __attribute__((target("sha3,neon"))) int64x2_t vbcaxq_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  67085   int64x2_t __ret;
  67086   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67087   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67088   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67089   __ret = (int64x2_t) __builtin_neon_vbcaxq_s64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35);
  67090   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67091   return __ret;
  67092 }
  67093 #endif
  67094 
  67095 #ifdef __LITTLE_ENDIAN__
  67096 __ai __attribute__((target("sha3,neon"))) int16x8_t vbcaxq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  67097   int16x8_t __ret;
  67098   __ret = (int16x8_t) __builtin_neon_vbcaxq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  67099   return __ret;
  67100 }
  67101 #else
  67102 __ai __attribute__((target("sha3,neon"))) int16x8_t vbcaxq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  67103   int16x8_t __ret;
  67104   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  67105   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  67106   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  67107   __ret = (int16x8_t) __builtin_neon_vbcaxq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33);
  67108   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  67109   return __ret;
  67110 }
  67111 #endif
  67112 
  67113 #ifdef __LITTLE_ENDIAN__
  67114 __ai __attribute__((target("sha3,neon"))) uint8x16_t veor3q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  67115   uint8x16_t __ret;
  67116   __ret = (uint8x16_t) __builtin_neon_veor3q_u8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48);
  67117   return __ret;
  67118 }
  67119 #else
  67120 __ai __attribute__((target("sha3,neon"))) uint8x16_t veor3q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  67121   uint8x16_t __ret;
  67122   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67123   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67124   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67125   __ret = (uint8x16_t) __builtin_neon_veor3q_u8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48);
  67126   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67127   return __ret;
  67128 }
  67129 #endif
  67130 
  67131 #ifdef __LITTLE_ENDIAN__
  67132 __ai __attribute__((target("sha3,neon"))) uint32x4_t veor3q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67133   uint32x4_t __ret;
  67134   __ret = (uint32x4_t) __builtin_neon_veor3q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  67135   return __ret;
  67136 }
  67137 #else
  67138 __ai __attribute__((target("sha3,neon"))) uint32x4_t veor3q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67139   uint32x4_t __ret;
  67140   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67141   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67142   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67143   __ret = (uint32x4_t) __builtin_neon_veor3q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  67144   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67145   return __ret;
  67146 }
  67147 #endif
  67148 
  67149 #ifdef __LITTLE_ENDIAN__
  67150 __ai __attribute__((target("sha3,neon"))) uint64x2_t veor3q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67151   uint64x2_t __ret;
  67152   __ret = (uint64x2_t) __builtin_neon_veor3q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
  67153   return __ret;
  67154 }
  67155 #else
  67156 __ai __attribute__((target("sha3,neon"))) uint64x2_t veor3q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67157   uint64x2_t __ret;
  67158   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67159   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67160   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67161   __ret = (uint64x2_t) __builtin_neon_veor3q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
  67162   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67163   return __ret;
  67164 }
  67165 #endif
  67166 
  67167 #ifdef __LITTLE_ENDIAN__
  67168 __ai __attribute__((target("sha3,neon"))) uint16x8_t veor3q_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  67169   uint16x8_t __ret;
  67170   __ret = (uint16x8_t) __builtin_neon_veor3q_u16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49);
  67171   return __ret;
  67172 }
  67173 #else
  67174 __ai __attribute__((target("sha3,neon"))) uint16x8_t veor3q_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  67175   uint16x8_t __ret;
  67176   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  67177   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  67178   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  67179   __ret = (uint16x8_t) __builtin_neon_veor3q_u16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49);
  67180   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  67181   return __ret;
  67182 }
  67183 #endif
  67184 
  67185 #ifdef __LITTLE_ENDIAN__
  67186 __ai __attribute__((target("sha3,neon"))) int8x16_t veor3q_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  67187   int8x16_t __ret;
  67188   __ret = (int8x16_t) __builtin_neon_veor3q_s8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32);
  67189   return __ret;
  67190 }
  67191 #else
  67192 __ai __attribute__((target("sha3,neon"))) int8x16_t veor3q_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  67193   int8x16_t __ret;
  67194   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67195   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67196   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67197   __ret = (int8x16_t) __builtin_neon_veor3q_s8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32);
  67198   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  67199   return __ret;
  67200 }
  67201 #endif
  67202 
  67203 #ifdef __LITTLE_ENDIAN__
  67204 __ai __attribute__((target("sha3,neon"))) int32x4_t veor3q_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  67205   int32x4_t __ret;
  67206   __ret = (int32x4_t) __builtin_neon_veor3q_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
  67207   return __ret;
  67208 }
  67209 #else
  67210 __ai __attribute__((target("sha3,neon"))) int32x4_t veor3q_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  67211   int32x4_t __ret;
  67212   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67213   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67214   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67215   __ret = (int32x4_t) __builtin_neon_veor3q_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34);
  67216   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67217   return __ret;
  67218 }
  67219 #endif
  67220 
  67221 #ifdef __LITTLE_ENDIAN__
  67222 __ai __attribute__((target("sha3,neon"))) int64x2_t veor3q_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  67223   int64x2_t __ret;
  67224   __ret = (int64x2_t) __builtin_neon_veor3q_s64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35);
  67225   return __ret;
  67226 }
  67227 #else
  67228 __ai __attribute__((target("sha3,neon"))) int64x2_t veor3q_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) {
  67229   int64x2_t __ret;
  67230   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67231   int64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67232   int64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67233   __ret = (int64x2_t) __builtin_neon_veor3q_s64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35);
  67234   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67235   return __ret;
  67236 }
  67237 #endif
  67238 
  67239 #ifdef __LITTLE_ENDIAN__
  67240 __ai __attribute__((target("sha3,neon"))) int16x8_t veor3q_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  67241   int16x8_t __ret;
  67242   __ret = (int16x8_t) __builtin_neon_veor3q_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33);
  67243   return __ret;
  67244 }
  67245 #else
  67246 __ai __attribute__((target("sha3,neon"))) int16x8_t veor3q_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  67247   int16x8_t __ret;
  67248   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  67249   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  67250   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  67251   __ret = (int16x8_t) __builtin_neon_veor3q_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33);
  67252   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  67253   return __ret;
  67254 }
  67255 #endif
  67256 
  67257 #ifdef __LITTLE_ENDIAN__
  67258 __ai __attribute__((target("sha3,neon"))) uint64x2_t vrax1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  67259   uint64x2_t __ret;
  67260   __ret = (uint64x2_t) __builtin_neon_vrax1q_u64((int8x16_t)__p0, (int8x16_t)__p1, 51);
  67261   return __ret;
  67262 }
  67263 #else
  67264 __ai __attribute__((target("sha3,neon"))) uint64x2_t vrax1q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  67265   uint64x2_t __ret;
  67266   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67267   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67268   __ret = (uint64x2_t) __builtin_neon_vrax1q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  67269   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67270   return __ret;
  67271 }
  67272 #endif
  67273 
  67274 #ifdef __LITTLE_ENDIAN__
  67275 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512hq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67276   uint64x2_t __ret;
  67277   __ret = (uint64x2_t) __builtin_neon_vsha512hq_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
  67278   return __ret;
  67279 }
  67280 #else
  67281 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512hq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67282   uint64x2_t __ret;
  67283   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67284   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67285   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67286   __ret = (uint64x2_t) __builtin_neon_vsha512hq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
  67287   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67288   return __ret;
  67289 }
  67290 #endif
  67291 
  67292 #ifdef __LITTLE_ENDIAN__
  67293 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512h2q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67294   uint64x2_t __ret;
  67295   __ret = (uint64x2_t) __builtin_neon_vsha512h2q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
  67296   return __ret;
  67297 }
  67298 #else
  67299 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512h2q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67300   uint64x2_t __ret;
  67301   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67302   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67303   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67304   __ret = (uint64x2_t) __builtin_neon_vsha512h2q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
  67305   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67306   return __ret;
  67307 }
  67308 #endif
  67309 
  67310 #ifdef __LITTLE_ENDIAN__
  67311 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su0q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  67312   uint64x2_t __ret;
  67313   __ret = (uint64x2_t) __builtin_neon_vsha512su0q_u64((int8x16_t)__p0, (int8x16_t)__p1, 51);
  67314   return __ret;
  67315 }
  67316 #else
  67317 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su0q_u64(uint64x2_t __p0, uint64x2_t __p1) {
  67318   uint64x2_t __ret;
  67319   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67320   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67321   __ret = (uint64x2_t) __builtin_neon_vsha512su0q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, 51);
  67322   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67323   return __ret;
  67324 }
  67325 #endif
  67326 
  67327 #ifdef __LITTLE_ENDIAN__
  67328 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su1q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67329   uint64x2_t __ret;
  67330   __ret = (uint64x2_t) __builtin_neon_vsha512su1q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51);
  67331   return __ret;
  67332 }
  67333 #else
  67334 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su1q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) {
  67335   uint64x2_t __ret;
  67336   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67337   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67338   uint64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67339   __ret = (uint64x2_t) __builtin_neon_vsha512su1q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51);
  67340   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67341   return __ret;
  67342 }
  67343 #endif
  67344 
  /*
   * vxarq_u64(__p0, __p1, __p2): statement-expression macro. The first two
   * arguments are copied into uint64x2_t temporaries, reinterpreted as
   * int8x16_t and passed to __builtin_neon_vxarq_u64 together with __p2 and
   * the constant 51; the macro's value is the builtin's result viewed as
   * uint64x2_t.
   * __p2 is pasted straight into the builtin call instead of being copied to
   * a local (presumably because it has to be a compile-time constant --
   * confirm).
   * The big-endian variant swaps the two lanes of each vector operand before
   * the call and swaps the lanes of the result afterwards.
   */
  67345 #ifdef __LITTLE_ENDIAN__
  67346 #define vxarq_u64(__p0, __p1, __p2) __extension__ ({ \
  67347   uint64x2_t __ret; \
  67348   uint64x2_t __s0 = __p0; \
  67349   uint64x2_t __s1 = __p1; \
  67350   __ret = (uint64x2_t) __builtin_neon_vxarq_u64((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \
  67351   __ret; \
  67352 })
  67353 #else
  67354 #define vxarq_u64(__p0, __p1, __p2) __extension__ ({ \
  67355   uint64x2_t __ret; \
  67356   uint64x2_t __s0 = __p0; \
  67357   uint64x2_t __s1 = __p1; \
  67358   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  67359   uint64x2_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  67360   __ret = (uint64x2_t) __builtin_neon_vxarq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \
  67361   __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  67362   __ret; \
  67363 })
  67364 #endif
  67365 
  67366 #ifdef __LITTLE_ENDIAN__
  67367 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67368   uint32x4_t __ret;
  67369   __ret = (uint32x4_t) __builtin_neon_vsm3partw1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  67370   return __ret;
  67371 }
  67372 #else
  67373 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67374   uint32x4_t __ret;
  67375   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67376   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67377   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67378   __ret = (uint32x4_t) __builtin_neon_vsm3partw1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  67379   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67380   return __ret;
  67381 }
  67382 #endif
  67383 
  67384 #ifdef __LITTLE_ENDIAN__
  67385 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67386   uint32x4_t __ret;
  67387   __ret = (uint32x4_t) __builtin_neon_vsm3partw2q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  67388   return __ret;
  67389 }
  67390 #else
  67391 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67392   uint32x4_t __ret;
  67393   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67394   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67395   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67396   __ret = (uint32x4_t) __builtin_neon_vsm3partw2q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  67397   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67398   return __ret;
  67399 }
  67400 #endif
  67401 
  67402 #ifdef __LITTLE_ENDIAN__
  67403 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3ss1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67404   uint32x4_t __ret;
  67405   __ret = (uint32x4_t) __builtin_neon_vsm3ss1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
  67406   return __ret;
  67407 }
  67408 #else
  67409 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3ss1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  67410   uint32x4_t __ret;
  67411   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67412   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67413   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  67414   __ret = (uint32x4_t) __builtin_neon_vsm3ss1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50);
  67415   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67416   return __ret;
  67417 }
  67418 #endif
  67419 
  /*
   * vsm3tt1aq_u32(__p0, __p1, __p2, __p3): statement-expression macro. The
   * first three arguments are copied into uint32x4_t temporaries,
   * reinterpreted as int8x16_t and passed to __builtin_neon_vsm3tt1aq_u32
   * together with __p3 and the constant 50; the macro's value is the
   * builtin's result viewed as uint32x4_t.
   * __p3 is pasted straight into the builtin call instead of being copied to
   * a local (presumably because it has to be a compile-time constant --
   * confirm).
   * The big-endian variant reverses the four lanes of each vector operand
   * before the call and reverses the lanes of the result afterwards.
   */
  67420 #ifdef __LITTLE_ENDIAN__
  67421 #define vsm3tt1aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67422   uint32x4_t __ret; \
  67423   uint32x4_t __s0 = __p0; \
  67424   uint32x4_t __s1 = __p1; \
  67425   uint32x4_t __s2 = __p2; \
  67426   __ret = (uint32x4_t) __builtin_neon_vsm3tt1aq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \
  67427   __ret; \
  67428 })
  67429 #else
  67430 #define vsm3tt1aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67431   uint32x4_t __ret; \
  67432   uint32x4_t __s0 = __p0; \
  67433   uint32x4_t __s1 = __p1; \
  67434   uint32x4_t __s2 = __p2; \
  67435   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  67436   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  67437   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  67438   __ret = (uint32x4_t) __builtin_neon_vsm3tt1aq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \
  67439   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  67440   __ret; \
  67441 })
  67442 #endif
  67443 
  /*
   * vsm3tt1bq_u32(__p0, __p1, __p2, __p3): statement-expression macro. The
   * first three arguments are copied into uint32x4_t temporaries,
   * reinterpreted as int8x16_t and passed to __builtin_neon_vsm3tt1bq_u32
   * together with __p3 and the constant 50; the macro's value is the
   * builtin's result viewed as uint32x4_t.
   * __p3 is pasted straight into the builtin call instead of being copied to
   * a local (presumably because it has to be a compile-time constant --
   * confirm).
   * The big-endian variant reverses the four lanes of each vector operand
   * before the call and reverses the lanes of the result afterwards.
   */
  67444 #ifdef __LITTLE_ENDIAN__
  67445 #define vsm3tt1bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67446   uint32x4_t __ret; \
  67447   uint32x4_t __s0 = __p0; \
  67448   uint32x4_t __s1 = __p1; \
  67449   uint32x4_t __s2 = __p2; \
  67450   __ret = (uint32x4_t) __builtin_neon_vsm3tt1bq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \
  67451   __ret; \
  67452 })
  67453 #else
  67454 #define vsm3tt1bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67455   uint32x4_t __ret; \
  67456   uint32x4_t __s0 = __p0; \
  67457   uint32x4_t __s1 = __p1; \
  67458   uint32x4_t __s2 = __p2; \
  67459   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  67460   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  67461   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  67462   __ret = (uint32x4_t) __builtin_neon_vsm3tt1bq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \
  67463   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  67464   __ret; \
  67465 })
  67466 #endif
  67467 
  /*
   * vsm3tt2aq_u32(__p0, __p1, __p2, __p3): statement-expression macro. The
   * first three arguments are copied into uint32x4_t temporaries,
   * reinterpreted as int8x16_t and passed to __builtin_neon_vsm3tt2aq_u32
   * together with __p3 and the constant 50; the macro's value is the
   * builtin's result viewed as uint32x4_t.
   * __p3 is pasted straight into the builtin call instead of being copied to
   * a local (presumably because it has to be a compile-time constant --
   * confirm).
   * The big-endian variant reverses the four lanes of each vector operand
   * before the call and reverses the lanes of the result afterwards.
   */
  67468 #ifdef __LITTLE_ENDIAN__
  67469 #define vsm3tt2aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67470   uint32x4_t __ret; \
  67471   uint32x4_t __s0 = __p0; \
  67472   uint32x4_t __s1 = __p1; \
  67473   uint32x4_t __s2 = __p2; \
  67474   __ret = (uint32x4_t) __builtin_neon_vsm3tt2aq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \
  67475   __ret; \
  67476 })
  67477 #else
  67478 #define vsm3tt2aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67479   uint32x4_t __ret; \
  67480   uint32x4_t __s0 = __p0; \
  67481   uint32x4_t __s1 = __p1; \
  67482   uint32x4_t __s2 = __p2; \
  67483   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  67484   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  67485   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  67486   __ret = (uint32x4_t) __builtin_neon_vsm3tt2aq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \
  67487   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  67488   __ret; \
  67489 })
  67490 #endif
  67491 
  /*
   * vsm3tt2bq_u32(__p0, __p1, __p2, __p3): statement-expression macro. The
   * first three arguments are copied into uint32x4_t temporaries,
   * reinterpreted as int8x16_t and passed to __builtin_neon_vsm3tt2bq_u32
   * together with __p3 and the constant 50; the macro's value is the
   * builtin's result viewed as uint32x4_t.
   * __p3 is pasted straight into the builtin call instead of being copied to
   * a local (presumably because it has to be a compile-time constant --
   * confirm).
   * The big-endian variant reverses the four lanes of each vector operand
   * before the call and reverses the lanes of the result afterwards.
   */
  67492 #ifdef __LITTLE_ENDIAN__
  67493 #define vsm3tt2bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67494   uint32x4_t __ret; \
  67495   uint32x4_t __s0 = __p0; \
  67496   uint32x4_t __s1 = __p1; \
  67497   uint32x4_t __s2 = __p2; \
  67498   __ret = (uint32x4_t) __builtin_neon_vsm3tt2bq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \
  67499   __ret; \
  67500 })
  67501 #else
  67502 #define vsm3tt2bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \
  67503   uint32x4_t __ret; \
  67504   uint32x4_t __s0 = __p0; \
  67505   uint32x4_t __s1 = __p1; \
  67506   uint32x4_t __s2 = __p2; \
  67507   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  67508   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  67509   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \
  67510   __ret = (uint32x4_t) __builtin_neon_vsm3tt2bq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \
  67511   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  67512   __ret; \
  67513 })
  67514 #endif
  67515 
  67516 #ifdef __LITTLE_ENDIAN__
  67517 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4eq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  67518   uint32x4_t __ret;
  67519   __ret = (uint32x4_t) __builtin_neon_vsm4eq_u32((int8x16_t)__p0, (int8x16_t)__p1, 50);
  67520   return __ret;
  67521 }
  67522 #else
  67523 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4eq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  67524   uint32x4_t __ret;
  67525   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67526   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67527   __ret = (uint32x4_t) __builtin_neon_vsm4eq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  67528   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67529   return __ret;
  67530 }
  67531 #endif
  67532 
  67533 #ifdef __LITTLE_ENDIAN__
  67534 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4ekeyq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  67535   uint32x4_t __ret;
  67536   __ret = (uint32x4_t) __builtin_neon_vsm4ekeyq_u32((int8x16_t)__p0, (int8x16_t)__p1, 50);
  67537   return __ret;
  67538 }
  67539 #else
  67540 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4ekeyq_u32(uint32x4_t __p0, uint32x4_t __p1) {
  67541   uint32x4_t __ret;
  67542   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  67543   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  67544   __ret = (uint32x4_t) __builtin_neon_vsm4ekeyq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50);
  67545   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  67546   return __ret;
  67547 }
  67548 #endif
  67549 
  67550 __ai __attribute__((target("v8.1a,neon"))) int32_t vqrdmlahs_s32(int32_t __p0, int32_t __p1, int32_t __p2) {
  67551   int32_t __ret;
  67552   __ret = (int32_t) __builtin_neon_vqrdmlahs_s32(__p0, __p1, __p2);
  67553   return __ret;
  67554 }
  67555 __ai __attribute__((target("v8.1a,neon"))) int16_t vqrdmlahh_s16(int16_t __p0, int16_t __p1, int16_t __p2) {
  67556   int16_t __ret;
  67557   __ret = (int16_t) __builtin_neon_vqrdmlahh_s16(__p0, __p1, __p2);
  67558   return __ret;
  67559 }
  /*
   * vqrdmlahs_lane_s32(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlahs_s32(acc, mul, <element `lane` of vec>), where acc and
   * mul are int32_t and vec is an int32x2_t.
   * Little-endian: the element is read with vget_lane_s32.
   * Big-endian: the two lanes of vec are reversed first and the element is
   * read with __noswap_vget_lane_s32.
   * NOTE(review): the numeric suffixes on the locals (_760/_761) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67560 #ifdef __LITTLE_ENDIAN__
  67561 #define vqrdmlahs_lane_s32(__p0_760, __p1_760, __p2_760, __p3_760) __extension__ ({ \
  67562   int32_t __ret_760; \
  67563   int32_t __s0_760 = __p0_760; \
  67564   int32_t __s1_760 = __p1_760; \
  67565   int32x2_t __s2_760 = __p2_760; \
  67566   __ret_760 = vqrdmlahs_s32(__s0_760, __s1_760, vget_lane_s32(__s2_760, __p3_760)); \
  67567   __ret_760; \
  67568 })
  67569 #else
  67570 #define vqrdmlahs_lane_s32(__p0_761, __p1_761, __p2_761, __p3_761) __extension__ ({ \
  67571   int32_t __ret_761; \
  67572   int32_t __s0_761 = __p0_761; \
  67573   int32_t __s1_761 = __p1_761; \
  67574   int32x2_t __s2_761 = __p2_761; \
  67575   int32x2_t __rev2_761;  __rev2_761 = __builtin_shufflevector(__s2_761, __s2_761, 1, 0); \
  67576   __ret_761 = vqrdmlahs_s32(__s0_761, __s1_761, __noswap_vget_lane_s32(__rev2_761, __p3_761)); \
  67577   __ret_761; \
  67578 })
  67579 #endif
  67580 
  /*
   * vqrdmlahh_lane_s16(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlahh_s16(acc, mul, <element `lane` of vec>), where acc and
   * mul are int16_t and vec is an int16x4_t.
   * Little-endian: the element is read with vget_lane_s16.
   * Big-endian: the four lanes of vec are reversed first and the element is
   * read with __noswap_vget_lane_s16.
   * NOTE(review): the numeric suffixes on the locals (_762/_763) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67581 #ifdef __LITTLE_ENDIAN__
  67582 #define vqrdmlahh_lane_s16(__p0_762, __p1_762, __p2_762, __p3_762) __extension__ ({ \
  67583   int16_t __ret_762; \
  67584   int16_t __s0_762 = __p0_762; \
  67585   int16_t __s1_762 = __p1_762; \
  67586   int16x4_t __s2_762 = __p2_762; \
  67587   __ret_762 = vqrdmlahh_s16(__s0_762, __s1_762, vget_lane_s16(__s2_762, __p3_762)); \
  67588   __ret_762; \
  67589 })
  67590 #else
  67591 #define vqrdmlahh_lane_s16(__p0_763, __p1_763, __p2_763, __p3_763) __extension__ ({ \
  67592   int16_t __ret_763; \
  67593   int16_t __s0_763 = __p0_763; \
  67594   int16_t __s1_763 = __p1_763; \
  67595   int16x4_t __s2_763 = __p2_763; \
  67596   int16x4_t __rev2_763;  __rev2_763 = __builtin_shufflevector(__s2_763, __s2_763, 3, 2, 1, 0); \
  67597   __ret_763 = vqrdmlahh_s16(__s0_763, __s1_763, __noswap_vget_lane_s16(__rev2_763, __p3_763)); \
  67598   __ret_763; \
  67599 })
  67600 #endif
  67601 
  /*
   * vqrdmlahs_laneq_s32(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlahs_s32(acc, mul, <element `lane` of vec>), where acc and
   * mul are int32_t and vec is an int32x4_t.
   * Little-endian: the element is read with vgetq_lane_s32.
   * Big-endian: the four lanes of vec are reversed first and the element is
   * read with __noswap_vgetq_lane_s32.
   * NOTE(review): the numeric suffixes on the locals (_764/_765) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67602 #ifdef __LITTLE_ENDIAN__
  67603 #define vqrdmlahs_laneq_s32(__p0_764, __p1_764, __p2_764, __p3_764) __extension__ ({ \
  67604   int32_t __ret_764; \
  67605   int32_t __s0_764 = __p0_764; \
  67606   int32_t __s1_764 = __p1_764; \
  67607   int32x4_t __s2_764 = __p2_764; \
  67608   __ret_764 = vqrdmlahs_s32(__s0_764, __s1_764, vgetq_lane_s32(__s2_764, __p3_764)); \
  67609   __ret_764; \
  67610 })
  67611 #else
  67612 #define vqrdmlahs_laneq_s32(__p0_765, __p1_765, __p2_765, __p3_765) __extension__ ({ \
  67613   int32_t __ret_765; \
  67614   int32_t __s0_765 = __p0_765; \
  67615   int32_t __s1_765 = __p1_765; \
  67616   int32x4_t __s2_765 = __p2_765; \
  67617   int32x4_t __rev2_765;  __rev2_765 = __builtin_shufflevector(__s2_765, __s2_765, 3, 2, 1, 0); \
  67618   __ret_765 = vqrdmlahs_s32(__s0_765, __s1_765, __noswap_vgetq_lane_s32(__rev2_765, __p3_765)); \
  67619   __ret_765; \
  67620 })
  67621 #endif
  67622 
  /*
   * vqrdmlahh_laneq_s16(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlahh_s16(acc, mul, <element `lane` of vec>), where acc and
   * mul are int16_t and vec is an int16x8_t.
   * Little-endian: the element is read with vgetq_lane_s16.
   * Big-endian: the eight lanes of vec are reversed first and the element is
   * read with __noswap_vgetq_lane_s16.
   * NOTE(review): the numeric suffixes on the locals (_766/_767) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67623 #ifdef __LITTLE_ENDIAN__
  67624 #define vqrdmlahh_laneq_s16(__p0_766, __p1_766, __p2_766, __p3_766) __extension__ ({ \
  67625   int16_t __ret_766; \
  67626   int16_t __s0_766 = __p0_766; \
  67627   int16_t __s1_766 = __p1_766; \
  67628   int16x8_t __s2_766 = __p2_766; \
  67629   __ret_766 = vqrdmlahh_s16(__s0_766, __s1_766, vgetq_lane_s16(__s2_766, __p3_766)); \
  67630   __ret_766; \
  67631 })
  67632 #else
  67633 #define vqrdmlahh_laneq_s16(__p0_767, __p1_767, __p2_767, __p3_767) __extension__ ({ \
  67634   int16_t __ret_767; \
  67635   int16_t __s0_767 = __p0_767; \
  67636   int16_t __s1_767 = __p1_767; \
  67637   int16x8_t __s2_767 = __p2_767; \
  67638   int16x8_t __rev2_767;  __rev2_767 = __builtin_shufflevector(__s2_767, __s2_767, 7, 6, 5, 4, 3, 2, 1, 0); \
  67639   __ret_767 = vqrdmlahh_s16(__s0_767, __s1_767, __noswap_vgetq_lane_s16(__rev2_767, __p3_767)); \
  67640   __ret_767; \
  67641 })
  67642 #endif
  67643 
  /*
   * vqrdmlahq_laneq_s32(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlahq_s32(a, b, splatq_laneq_s32(vec, lane)); a, b, vec and
   * the result are all int32x4_t.
   * Big-endian: a, b and vec each have their four lanes reversed, the
   * __noswap_ forms of vqrdmlahq_s32 and splatq_laneq_s32 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_768/_769) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67644 #ifdef __LITTLE_ENDIAN__
  67645 #define vqrdmlahq_laneq_s32(__p0_768, __p1_768, __p2_768, __p3_768) __extension__ ({ \
  67646   int32x4_t __ret_768; \
  67647   int32x4_t __s0_768 = __p0_768; \
  67648   int32x4_t __s1_768 = __p1_768; \
  67649   int32x4_t __s2_768 = __p2_768; \
  67650   __ret_768 = vqrdmlahq_s32(__s0_768, __s1_768, splatq_laneq_s32(__s2_768, __p3_768)); \
  67651   __ret_768; \
  67652 })
  67653 #else
  67654 #define vqrdmlahq_laneq_s32(__p0_769, __p1_769, __p2_769, __p3_769) __extension__ ({ \
  67655   int32x4_t __ret_769; \
  67656   int32x4_t __s0_769 = __p0_769; \
  67657   int32x4_t __s1_769 = __p1_769; \
  67658   int32x4_t __s2_769 = __p2_769; \
  67659   int32x4_t __rev0_769;  __rev0_769 = __builtin_shufflevector(__s0_769, __s0_769, 3, 2, 1, 0); \
  67660   int32x4_t __rev1_769;  __rev1_769 = __builtin_shufflevector(__s1_769, __s1_769, 3, 2, 1, 0); \
  67661   int32x4_t __rev2_769;  __rev2_769 = __builtin_shufflevector(__s2_769, __s2_769, 3, 2, 1, 0); \
  67662   __ret_769 = __noswap_vqrdmlahq_s32(__rev0_769, __rev1_769, __noswap_splatq_laneq_s32(__rev2_769, __p3_769)); \
  67663   __ret_769 = __builtin_shufflevector(__ret_769, __ret_769, 3, 2, 1, 0); \
  67664   __ret_769; \
  67665 })
  67666 #endif
  67667 
  /*
   * vqrdmlahq_laneq_s16(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlahq_s16(a, b, splatq_laneq_s16(vec, lane)); a, b, vec and
   * the result are all int16x8_t.
   * Big-endian: a, b and vec each have their eight lanes reversed, the
   * __noswap_ forms of vqrdmlahq_s16 and splatq_laneq_s16 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_770/_771) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67668 #ifdef __LITTLE_ENDIAN__
  67669 #define vqrdmlahq_laneq_s16(__p0_770, __p1_770, __p2_770, __p3_770) __extension__ ({ \
  67670   int16x8_t __ret_770; \
  67671   int16x8_t __s0_770 = __p0_770; \
  67672   int16x8_t __s1_770 = __p1_770; \
  67673   int16x8_t __s2_770 = __p2_770; \
  67674   __ret_770 = vqrdmlahq_s16(__s0_770, __s1_770, splatq_laneq_s16(__s2_770, __p3_770)); \
  67675   __ret_770; \
  67676 })
  67677 #else
  67678 #define vqrdmlahq_laneq_s16(__p0_771, __p1_771, __p2_771, __p3_771) __extension__ ({ \
  67679   int16x8_t __ret_771; \
  67680   int16x8_t __s0_771 = __p0_771; \
  67681   int16x8_t __s1_771 = __p1_771; \
  67682   int16x8_t __s2_771 = __p2_771; \
  67683   int16x8_t __rev0_771;  __rev0_771 = __builtin_shufflevector(__s0_771, __s0_771, 7, 6, 5, 4, 3, 2, 1, 0); \
  67684   int16x8_t __rev1_771;  __rev1_771 = __builtin_shufflevector(__s1_771, __s1_771, 7, 6, 5, 4, 3, 2, 1, 0); \
  67685   int16x8_t __rev2_771;  __rev2_771 = __builtin_shufflevector(__s2_771, __s2_771, 7, 6, 5, 4, 3, 2, 1, 0); \
  67686   __ret_771 = __noswap_vqrdmlahq_s16(__rev0_771, __rev1_771, __noswap_splatq_laneq_s16(__rev2_771, __p3_771)); \
  67687   __ret_771 = __builtin_shufflevector(__ret_771, __ret_771, 7, 6, 5, 4, 3, 2, 1, 0); \
  67688   __ret_771; \
  67689 })
  67690 #endif
  67691 
  /*
   * vqrdmlah_laneq_s32(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlah_s32(a, b, splat_laneq_s32(vec, lane)); a, b and the
   * result are int32x2_t while vec is an int32x4_t.
   * Big-endian: a and b have their two lanes reversed and vec its four lanes,
   * the __noswap_ forms of vqrdmlah_s32 and splat_laneq_s32 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_772/_773) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67692 #ifdef __LITTLE_ENDIAN__
  67693 #define vqrdmlah_laneq_s32(__p0_772, __p1_772, __p2_772, __p3_772) __extension__ ({ \
  67694   int32x2_t __ret_772; \
  67695   int32x2_t __s0_772 = __p0_772; \
  67696   int32x2_t __s1_772 = __p1_772; \
  67697   int32x4_t __s2_772 = __p2_772; \
  67698   __ret_772 = vqrdmlah_s32(__s0_772, __s1_772, splat_laneq_s32(__s2_772, __p3_772)); \
  67699   __ret_772; \
  67700 })
  67701 #else
  67702 #define vqrdmlah_laneq_s32(__p0_773, __p1_773, __p2_773, __p3_773) __extension__ ({ \
  67703   int32x2_t __ret_773; \
  67704   int32x2_t __s0_773 = __p0_773; \
  67705   int32x2_t __s1_773 = __p1_773; \
  67706   int32x4_t __s2_773 = __p2_773; \
  67707   int32x2_t __rev0_773;  __rev0_773 = __builtin_shufflevector(__s0_773, __s0_773, 1, 0); \
  67708   int32x2_t __rev1_773;  __rev1_773 = __builtin_shufflevector(__s1_773, __s1_773, 1, 0); \
  67709   int32x4_t __rev2_773;  __rev2_773 = __builtin_shufflevector(__s2_773, __s2_773, 3, 2, 1, 0); \
  67710   __ret_773 = __noswap_vqrdmlah_s32(__rev0_773, __rev1_773, __noswap_splat_laneq_s32(__rev2_773, __p3_773)); \
  67711   __ret_773 = __builtin_shufflevector(__ret_773, __ret_773, 1, 0); \
  67712   __ret_773; \
  67713 })
  67714 #endif
  67715 
  /*
   * vqrdmlah_laneq_s16(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlah_s16(a, b, splat_laneq_s16(vec, lane)); a, b and the
   * result are int16x4_t while vec is an int16x8_t.
   * Big-endian: a and b have their four lanes reversed and vec its eight
   * lanes, the __noswap_ forms of vqrdmlah_s16 and splat_laneq_s16 are called
   * on the reversed values, and the result's lanes are reversed again before
   * it is yielded.
   * NOTE(review): the numeric suffixes on the locals (_774/_775) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67716 #ifdef __LITTLE_ENDIAN__
  67717 #define vqrdmlah_laneq_s16(__p0_774, __p1_774, __p2_774, __p3_774) __extension__ ({ \
  67718   int16x4_t __ret_774; \
  67719   int16x4_t __s0_774 = __p0_774; \
  67720   int16x4_t __s1_774 = __p1_774; \
  67721   int16x8_t __s2_774 = __p2_774; \
  67722   __ret_774 = vqrdmlah_s16(__s0_774, __s1_774, splat_laneq_s16(__s2_774, __p3_774)); \
  67723   __ret_774; \
  67724 })
  67725 #else
  67726 #define vqrdmlah_laneq_s16(__p0_775, __p1_775, __p2_775, __p3_775) __extension__ ({ \
  67727   int16x4_t __ret_775; \
  67728   int16x4_t __s0_775 = __p0_775; \
  67729   int16x4_t __s1_775 = __p1_775; \
  67730   int16x8_t __s2_775 = __p2_775; \
  67731   int16x4_t __rev0_775;  __rev0_775 = __builtin_shufflevector(__s0_775, __s0_775, 3, 2, 1, 0); \
  67732   int16x4_t __rev1_775;  __rev1_775 = __builtin_shufflevector(__s1_775, __s1_775, 3, 2, 1, 0); \
  67733   int16x8_t __rev2_775;  __rev2_775 = __builtin_shufflevector(__s2_775, __s2_775, 7, 6, 5, 4, 3, 2, 1, 0); \
  67734   __ret_775 = __noswap_vqrdmlah_s16(__rev0_775, __rev1_775, __noswap_splat_laneq_s16(__rev2_775, __p3_775)); \
  67735   __ret_775 = __builtin_shufflevector(__ret_775, __ret_775, 3, 2, 1, 0); \
  67736   __ret_775; \
  67737 })
  67738 #endif
  67739 
  67740 __ai __attribute__((target("v8.1a,neon"))) int32_t vqrdmlshs_s32(int32_t __p0, int32_t __p1, int32_t __p2) {
  67741   int32_t __ret;
  67742   __ret = (int32_t) __builtin_neon_vqrdmlshs_s32(__p0, __p1, __p2);
  67743   return __ret;
  67744 }
  67745 __ai __attribute__((target("v8.1a,neon"))) int16_t vqrdmlshh_s16(int16_t __p0, int16_t __p1, int16_t __p2) {
  67746   int16_t __ret;
  67747   __ret = (int16_t) __builtin_neon_vqrdmlshh_s16(__p0, __p1, __p2);
  67748   return __ret;
  67749 }
  /*
   * vqrdmlshs_lane_s32(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlshs_s32(acc, mul, <element `lane` of vec>), where acc and
   * mul are int32_t and vec is an int32x2_t.
   * Little-endian: the element is read with vget_lane_s32.
   * Big-endian: the two lanes of vec are reversed first and the element is
   * read with __noswap_vget_lane_s32.
   * NOTE(review): the numeric suffixes on the locals (_776/_777) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67750 #ifdef __LITTLE_ENDIAN__
  67751 #define vqrdmlshs_lane_s32(__p0_776, __p1_776, __p2_776, __p3_776) __extension__ ({ \
  67752   int32_t __ret_776; \
  67753   int32_t __s0_776 = __p0_776; \
  67754   int32_t __s1_776 = __p1_776; \
  67755   int32x2_t __s2_776 = __p2_776; \
  67756   __ret_776 = vqrdmlshs_s32(__s0_776, __s1_776, vget_lane_s32(__s2_776, __p3_776)); \
  67757   __ret_776; \
  67758 })
  67759 #else
  67760 #define vqrdmlshs_lane_s32(__p0_777, __p1_777, __p2_777, __p3_777) __extension__ ({ \
  67761   int32_t __ret_777; \
  67762   int32_t __s0_777 = __p0_777; \
  67763   int32_t __s1_777 = __p1_777; \
  67764   int32x2_t __s2_777 = __p2_777; \
  67765   int32x2_t __rev2_777;  __rev2_777 = __builtin_shufflevector(__s2_777, __s2_777, 1, 0); \
  67766   __ret_777 = vqrdmlshs_s32(__s0_777, __s1_777, __noswap_vget_lane_s32(__rev2_777, __p3_777)); \
  67767   __ret_777; \
  67768 })
  67769 #endif
  67770 
  /*
   * vqrdmlshh_lane_s16(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlshh_s16(acc, mul, <element `lane` of vec>), where acc and
   * mul are int16_t and vec is an int16x4_t.
   * Little-endian: the element is read with vget_lane_s16.
   * Big-endian: the four lanes of vec are reversed first and the element is
   * read with __noswap_vget_lane_s16.
   * NOTE(review): the numeric suffixes on the locals (_778/_779) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67771 #ifdef __LITTLE_ENDIAN__
  67772 #define vqrdmlshh_lane_s16(__p0_778, __p1_778, __p2_778, __p3_778) __extension__ ({ \
  67773   int16_t __ret_778; \
  67774   int16_t __s0_778 = __p0_778; \
  67775   int16_t __s1_778 = __p1_778; \
  67776   int16x4_t __s2_778 = __p2_778; \
  67777   __ret_778 = vqrdmlshh_s16(__s0_778, __s1_778, vget_lane_s16(__s2_778, __p3_778)); \
  67778   __ret_778; \
  67779 })
  67780 #else
  67781 #define vqrdmlshh_lane_s16(__p0_779, __p1_779, __p2_779, __p3_779) __extension__ ({ \
  67782   int16_t __ret_779; \
  67783   int16_t __s0_779 = __p0_779; \
  67784   int16_t __s1_779 = __p1_779; \
  67785   int16x4_t __s2_779 = __p2_779; \
  67786   int16x4_t __rev2_779;  __rev2_779 = __builtin_shufflevector(__s2_779, __s2_779, 3, 2, 1, 0); \
  67787   __ret_779 = vqrdmlshh_s16(__s0_779, __s1_779, __noswap_vget_lane_s16(__rev2_779, __p3_779)); \
  67788   __ret_779; \
  67789 })
  67790 #endif
  67791 
  /*
   * vqrdmlshs_laneq_s32(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlshs_s32(acc, mul, <element `lane` of vec>), where acc and
   * mul are int32_t and vec is an int32x4_t.
   * Little-endian: the element is read with vgetq_lane_s32.
   * Big-endian: the four lanes of vec are reversed first and the element is
   * read with __noswap_vgetq_lane_s32.
   * NOTE(review): the numeric suffixes on the locals (_780/_781) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67792 #ifdef __LITTLE_ENDIAN__
  67793 #define vqrdmlshs_laneq_s32(__p0_780, __p1_780, __p2_780, __p3_780) __extension__ ({ \
  67794   int32_t __ret_780; \
  67795   int32_t __s0_780 = __p0_780; \
  67796   int32_t __s1_780 = __p1_780; \
  67797   int32x4_t __s2_780 = __p2_780; \
  67798   __ret_780 = vqrdmlshs_s32(__s0_780, __s1_780, vgetq_lane_s32(__s2_780, __p3_780)); \
  67799   __ret_780; \
  67800 })
  67801 #else
  67802 #define vqrdmlshs_laneq_s32(__p0_781, __p1_781, __p2_781, __p3_781) __extension__ ({ \
  67803   int32_t __ret_781; \
  67804   int32_t __s0_781 = __p0_781; \
  67805   int32_t __s1_781 = __p1_781; \
  67806   int32x4_t __s2_781 = __p2_781; \
  67807   int32x4_t __rev2_781;  __rev2_781 = __builtin_shufflevector(__s2_781, __s2_781, 3, 2, 1, 0); \
  67808   __ret_781 = vqrdmlshs_s32(__s0_781, __s1_781, __noswap_vgetq_lane_s32(__rev2_781, __p3_781)); \
  67809   __ret_781; \
  67810 })
  67811 #endif
  67812 
  /*
   * vqrdmlshh_laneq_s16(acc, mul, vec, lane): statement-expression macro that
   * evaluates vqrdmlshh_s16(acc, mul, <element `lane` of vec>), where acc and
   * mul are int16_t and vec is an int16x8_t.
   * Little-endian: the element is read with vgetq_lane_s16.
   * Big-endian: the eight lanes of vec are reversed first and the element is
   * read with __noswap_vgetq_lane_s16.
   * NOTE(review): the numeric suffixes on the locals (_782/_783) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67813 #ifdef __LITTLE_ENDIAN__
  67814 #define vqrdmlshh_laneq_s16(__p0_782, __p1_782, __p2_782, __p3_782) __extension__ ({ \
  67815   int16_t __ret_782; \
  67816   int16_t __s0_782 = __p0_782; \
  67817   int16_t __s1_782 = __p1_782; \
  67818   int16x8_t __s2_782 = __p2_782; \
  67819   __ret_782 = vqrdmlshh_s16(__s0_782, __s1_782, vgetq_lane_s16(__s2_782, __p3_782)); \
  67820   __ret_782; \
  67821 })
  67822 #else
  67823 #define vqrdmlshh_laneq_s16(__p0_783, __p1_783, __p2_783, __p3_783) __extension__ ({ \
  67824   int16_t __ret_783; \
  67825   int16_t __s0_783 = __p0_783; \
  67826   int16_t __s1_783 = __p1_783; \
  67827   int16x8_t __s2_783 = __p2_783; \
  67828   int16x8_t __rev2_783;  __rev2_783 = __builtin_shufflevector(__s2_783, __s2_783, 7, 6, 5, 4, 3, 2, 1, 0); \
  67829   __ret_783 = vqrdmlshh_s16(__s0_783, __s1_783, __noswap_vgetq_lane_s16(__rev2_783, __p3_783)); \
  67830   __ret_783; \
  67831 })
  67832 #endif
  67833 
  /*
   * vqrdmlshq_laneq_s32(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlshq_s32(a, b, splatq_laneq_s32(vec, lane)); a, b, vec and
   * the result are all int32x4_t.
   * Big-endian: a, b and vec each have their four lanes reversed, the
   * __noswap_ forms of vqrdmlshq_s32 and splatq_laneq_s32 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_784/_785) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67834 #ifdef __LITTLE_ENDIAN__
  67835 #define vqrdmlshq_laneq_s32(__p0_784, __p1_784, __p2_784, __p3_784) __extension__ ({ \
  67836   int32x4_t __ret_784; \
  67837   int32x4_t __s0_784 = __p0_784; \
  67838   int32x4_t __s1_784 = __p1_784; \
  67839   int32x4_t __s2_784 = __p2_784; \
  67840   __ret_784 = vqrdmlshq_s32(__s0_784, __s1_784, splatq_laneq_s32(__s2_784, __p3_784)); \
  67841   __ret_784; \
  67842 })
  67843 #else
  67844 #define vqrdmlshq_laneq_s32(__p0_785, __p1_785, __p2_785, __p3_785) __extension__ ({ \
  67845   int32x4_t __ret_785; \
  67846   int32x4_t __s0_785 = __p0_785; \
  67847   int32x4_t __s1_785 = __p1_785; \
  67848   int32x4_t __s2_785 = __p2_785; \
  67849   int32x4_t __rev0_785;  __rev0_785 = __builtin_shufflevector(__s0_785, __s0_785, 3, 2, 1, 0); \
  67850   int32x4_t __rev1_785;  __rev1_785 = __builtin_shufflevector(__s1_785, __s1_785, 3, 2, 1, 0); \
  67851   int32x4_t __rev2_785;  __rev2_785 = __builtin_shufflevector(__s2_785, __s2_785, 3, 2, 1, 0); \
  67852   __ret_785 = __noswap_vqrdmlshq_s32(__rev0_785, __rev1_785, __noswap_splatq_laneq_s32(__rev2_785, __p3_785)); \
  67853   __ret_785 = __builtin_shufflevector(__ret_785, __ret_785, 3, 2, 1, 0); \
  67854   __ret_785; \
  67855 })
  67856 #endif
  67857 
  /*
   * vqrdmlshq_laneq_s16(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlshq_s16(a, b, splatq_laneq_s16(vec, lane)); a, b, vec and
   * the result are all int16x8_t.
   * Big-endian: a, b and vec each have their eight lanes reversed, the
   * __noswap_ forms of vqrdmlshq_s16 and splatq_laneq_s16 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_786/_787) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67858 #ifdef __LITTLE_ENDIAN__
  67859 #define vqrdmlshq_laneq_s16(__p0_786, __p1_786, __p2_786, __p3_786) __extension__ ({ \
  67860   int16x8_t __ret_786; \
  67861   int16x8_t __s0_786 = __p0_786; \
  67862   int16x8_t __s1_786 = __p1_786; \
  67863   int16x8_t __s2_786 = __p2_786; \
  67864   __ret_786 = vqrdmlshq_s16(__s0_786, __s1_786, splatq_laneq_s16(__s2_786, __p3_786)); \
  67865   __ret_786; \
  67866 })
  67867 #else
  67868 #define vqrdmlshq_laneq_s16(__p0_787, __p1_787, __p2_787, __p3_787) __extension__ ({ \
  67869   int16x8_t __ret_787; \
  67870   int16x8_t __s0_787 = __p0_787; \
  67871   int16x8_t __s1_787 = __p1_787; \
  67872   int16x8_t __s2_787 = __p2_787; \
  67873   int16x8_t __rev0_787;  __rev0_787 = __builtin_shufflevector(__s0_787, __s0_787, 7, 6, 5, 4, 3, 2, 1, 0); \
  67874   int16x8_t __rev1_787;  __rev1_787 = __builtin_shufflevector(__s1_787, __s1_787, 7, 6, 5, 4, 3, 2, 1, 0); \
  67875   int16x8_t __rev2_787;  __rev2_787 = __builtin_shufflevector(__s2_787, __s2_787, 7, 6, 5, 4, 3, 2, 1, 0); \
  67876   __ret_787 = __noswap_vqrdmlshq_s16(__rev0_787, __rev1_787, __noswap_splatq_laneq_s16(__rev2_787, __p3_787)); \
  67877   __ret_787 = __builtin_shufflevector(__ret_787, __ret_787, 7, 6, 5, 4, 3, 2, 1, 0); \
  67878   __ret_787; \
  67879 })
  67880 #endif
  67881 
  /*
   * vqrdmlsh_laneq_s32(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlsh_s32(a, b, splat_laneq_s32(vec, lane)); a, b and the
   * result are int32x2_t while vec is an int32x4_t.
   * Big-endian: a and b have their two lanes reversed and vec its four lanes,
   * the __noswap_ forms of vqrdmlsh_s32 and splat_laneq_s32 are called on the
   * reversed values, and the result's lanes are reversed again before it is
   * yielded.
   * NOTE(review): the numeric suffixes on the locals (_788/_789) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67882 #ifdef __LITTLE_ENDIAN__
  67883 #define vqrdmlsh_laneq_s32(__p0_788, __p1_788, __p2_788, __p3_788) __extension__ ({ \
  67884   int32x2_t __ret_788; \
  67885   int32x2_t __s0_788 = __p0_788; \
  67886   int32x2_t __s1_788 = __p1_788; \
  67887   int32x4_t __s2_788 = __p2_788; \
  67888   __ret_788 = vqrdmlsh_s32(__s0_788, __s1_788, splat_laneq_s32(__s2_788, __p3_788)); \
  67889   __ret_788; \
  67890 })
  67891 #else
  67892 #define vqrdmlsh_laneq_s32(__p0_789, __p1_789, __p2_789, __p3_789) __extension__ ({ \
  67893   int32x2_t __ret_789; \
  67894   int32x2_t __s0_789 = __p0_789; \
  67895   int32x2_t __s1_789 = __p1_789; \
  67896   int32x4_t __s2_789 = __p2_789; \
  67897   int32x2_t __rev0_789;  __rev0_789 = __builtin_shufflevector(__s0_789, __s0_789, 1, 0); \
  67898   int32x2_t __rev1_789;  __rev1_789 = __builtin_shufflevector(__s1_789, __s1_789, 1, 0); \
  67899   int32x4_t __rev2_789;  __rev2_789 = __builtin_shufflevector(__s2_789, __s2_789, 3, 2, 1, 0); \
  67900   __ret_789 = __noswap_vqrdmlsh_s32(__rev0_789, __rev1_789, __noswap_splat_laneq_s32(__rev2_789, __p3_789)); \
  67901   __ret_789 = __builtin_shufflevector(__ret_789, __ret_789, 1, 0); \
  67902   __ret_789; \
  67903 })
  67904 #endif
  67905 
  /*
   * vqrdmlsh_laneq_s16(a, b, vec, lane): statement-expression macro that
   * evaluates vqrdmlsh_s16(a, b, splat_laneq_s16(vec, lane)); a, b and the
   * result are int16x4_t while vec is an int16x8_t.
   * Big-endian: a and b have their four lanes reversed and vec its eight
   * lanes, the __noswap_ forms of vqrdmlsh_s16 and splat_laneq_s16 are called
   * on the reversed values, and the result's lanes are reversed again before
   * it is yielded.
   * NOTE(review): the numeric suffixes on the locals (_790/_791) are
   * presumably there to stop nested macro expansions from capturing each
   * other's temporaries -- do not rename without checking the callers.
   */
  67906 #ifdef __LITTLE_ENDIAN__
  67907 #define vqrdmlsh_laneq_s16(__p0_790, __p1_790, __p2_790, __p3_790) __extension__ ({ \
  67908   int16x4_t __ret_790; \
  67909   int16x4_t __s0_790 = __p0_790; \
  67910   int16x4_t __s1_790 = __p1_790; \
  67911   int16x8_t __s2_790 = __p2_790; \
  67912   __ret_790 = vqrdmlsh_s16(__s0_790, __s1_790, splat_laneq_s16(__s2_790, __p3_790)); \
  67913   __ret_790; \
  67914 })
  67915 #else
  67916 #define vqrdmlsh_laneq_s16(__p0_791, __p1_791, __p2_791, __p3_791) __extension__ ({ \
  67917   int16x4_t __ret_791; \
  67918   int16x4_t __s0_791 = __p0_791; \
  67919   int16x4_t __s1_791 = __p1_791; \
  67920   int16x8_t __s2_791 = __p2_791; \
  67921   int16x4_t __rev0_791;  __rev0_791 = __builtin_shufflevector(__s0_791, __s0_791, 3, 2, 1, 0); \
  67922   int16x4_t __rev1_791;  __rev1_791 = __builtin_shufflevector(__s1_791, __s1_791, 3, 2, 1, 0); \
  67923   int16x8_t __rev2_791;  __rev2_791 = __builtin_shufflevector(__s2_791, __s2_791, 7, 6, 5, 4, 3, 2, 1, 0); \
  67924   __ret_791 = __noswap_vqrdmlsh_s16(__rev0_791, __rev1_791, __noswap_splat_laneq_s16(__rev2_791, __p3_791)); \
  67925   __ret_791 = __builtin_shufflevector(__ret_791, __ret_791, 3, 2, 1, 0); \
  67926   __ret_791; \
  67927 })
  67928 #endif
  67929 
  67930 #ifdef __LITTLE_ENDIAN__
  67931 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot270_f64(float64x2_t __p0, float64x2_t __p1) {
  67932   float64x2_t __ret;
  67933   __ret = (float64x2_t) __builtin_neon_vcaddq_rot270_f64((int8x16_t)__p0, (int8x16_t)__p1, 42);
  67934   return __ret;
  67935 }
  67936 #else
  67937 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot270_f64(float64x2_t __p0, float64x2_t __p1) {
  67938   float64x2_t __ret;
  67939   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67940   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67941   __ret = (float64x2_t) __builtin_neon_vcaddq_rot270_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  67942   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67943   return __ret;
  67944 }
  67945 #endif
  67946 
  67947 #ifdef __LITTLE_ENDIAN__
  67948 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot90_f64(float64x2_t __p0, float64x2_t __p1) {
  67949   float64x2_t __ret;
  67950   __ret = (float64x2_t) __builtin_neon_vcaddq_rot90_f64((int8x16_t)__p0, (int8x16_t)__p1, 42);
  67951   return __ret;
  67952 }
  67953 #else
  67954 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot90_f64(float64x2_t __p0, float64x2_t __p1) {
  67955   float64x2_t __ret;
  67956   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67957   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67958   __ret = (float64x2_t) __builtin_neon_vcaddq_rot90_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42);
  67959   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67960   return __ret;
  67961 }
  67962 #endif
  67963 
  67964 #ifdef __LITTLE_ENDIAN__
  67965 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  67966   float64x2_t __ret;
  67967   __ret = (float64x2_t) __builtin_neon_vcmlaq_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  67968   return __ret;
  67969 }
  67970 #else
  67971 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  67972   float64x2_t __ret;
  67973   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67974   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67975   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67976   __ret = (float64x2_t) __builtin_neon_vcmlaq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  67977   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67978   return __ret;
  67979 }
  67980 #endif
  67981 
  67982 #ifdef __LITTLE_ENDIAN__
  67983 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot180_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  67984   float64x2_t __ret;
  67985   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot180_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  67986   return __ret;
  67987 }
  67988 #else
  67989 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot180_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  67990   float64x2_t __ret;
  67991   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  67992   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  67993   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  67994   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot180_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  67995   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  67996   return __ret;
  67997 }
  67998 #endif
  67999 
  68000 #ifdef __LITTLE_ENDIAN__
  68001 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot270_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  68002   float64x2_t __ret;
  68003   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot270_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  68004   return __ret;
  68005 }
  68006 #else
  68007 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot270_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  68008   float64x2_t __ret;
  68009   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68010   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  68011   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  68012   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot270_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  68013   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68014   return __ret;
  68015 }
  68016 #endif
  68017 
  68018 #ifdef __LITTLE_ENDIAN__
  68019 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot90_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  68020   float64x2_t __ret;
  68021   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot90_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42);
  68022   return __ret;
  68023 }
  68024 #else
  68025 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot90_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) {
  68026   float64x2_t __ret;
  68027   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68028   float64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  68029   float64x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  68030   __ret = (float64x2_t) __builtin_neon_vcmlaq_rot90_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42);
  68031   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68032   return __ret;
  68033 }
  68034 #endif
  68035 
  68036 #ifdef __LITTLE_ENDIAN__
  68037 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32xq_f32(float32x4_t __p0) {
  68038   float32x4_t __ret;
  68039   __ret = (float32x4_t) __builtin_neon_vrnd32xq_f32((int8x16_t)__p0, 41);
  68040   return __ret;
  68041 }
  68042 #else
  68043 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32xq_f32(float32x4_t __p0) {
  68044   float32x4_t __ret;
  68045   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68046   __ret = (float32x4_t) __builtin_neon_vrnd32xq_f32((int8x16_t)__rev0, 41);
  68047   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68048   return __ret;
  68049 }
  68050 #endif
  68051 
  68052 #ifdef __LITTLE_ENDIAN__
  68053 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32x_f32(float32x2_t __p0) {
  68054   float32x2_t __ret;
  68055   __ret = (float32x2_t) __builtin_neon_vrnd32x_f32((int8x8_t)__p0, 9);
  68056   return __ret;
  68057 }
  68058 #else
  68059 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32x_f32(float32x2_t __p0) {
  68060   float32x2_t __ret;
  68061   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68062   __ret = (float32x2_t) __builtin_neon_vrnd32x_f32((int8x8_t)__rev0, 9);
  68063   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68064   return __ret;
  68065 }
  68066 #endif
  68067 
  68068 #ifdef __LITTLE_ENDIAN__
  68069 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32xq_f64(float64x2_t __p0) {
  68070   float64x2_t __ret;
  68071   __ret = (float64x2_t) __builtin_neon_vrnd32xq_f64((int8x16_t)__p0, 42);
  68072   return __ret;
  68073 }
  68074 #else
  68075 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32xq_f64(float64x2_t __p0) {
  68076   float64x2_t __ret;
  68077   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68078   __ret = (float64x2_t) __builtin_neon_vrnd32xq_f64((int8x16_t)__rev0, 42);
  68079   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68080   return __ret;
  68081 }
  68082 #endif
  68083 
  68084 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd32x_f64(float64x1_t __p0) {
  68085   float64x1_t __ret;
  68086   __ret = (float64x1_t) __builtin_neon_vrnd32x_f64((int8x8_t)__p0, 10);
  68087   return __ret;
  68088 }
  68089 #ifdef __LITTLE_ENDIAN__
  68090 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32zq_f32(float32x4_t __p0) {
  68091   float32x4_t __ret;
  68092   __ret = (float32x4_t) __builtin_neon_vrnd32zq_f32((int8x16_t)__p0, 41);
  68093   return __ret;
  68094 }
  68095 #else
  68096 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32zq_f32(float32x4_t __p0) {
  68097   float32x4_t __ret;
  68098   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68099   __ret = (float32x4_t) __builtin_neon_vrnd32zq_f32((int8x16_t)__rev0, 41);
  68100   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68101   return __ret;
  68102 }
  68103 #endif
  68104 
  68105 #ifdef __LITTLE_ENDIAN__
  68106 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32z_f32(float32x2_t __p0) {
  68107   float32x2_t __ret;
  68108   __ret = (float32x2_t) __builtin_neon_vrnd32z_f32((int8x8_t)__p0, 9);
  68109   return __ret;
  68110 }
  68111 #else
  68112 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32z_f32(float32x2_t __p0) {
  68113   float32x2_t __ret;
  68114   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68115   __ret = (float32x2_t) __builtin_neon_vrnd32z_f32((int8x8_t)__rev0, 9);
  68116   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68117   return __ret;
  68118 }
  68119 #endif
  68120 
  68121 #ifdef __LITTLE_ENDIAN__
  68122 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32zq_f64(float64x2_t __p0) {
  68123   float64x2_t __ret;
  68124   __ret = (float64x2_t) __builtin_neon_vrnd32zq_f64((int8x16_t)__p0, 42);
  68125   return __ret;
  68126 }
  68127 #else
  68128 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32zq_f64(float64x2_t __p0) {
  68129   float64x2_t __ret;
  68130   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68131   __ret = (float64x2_t) __builtin_neon_vrnd32zq_f64((int8x16_t)__rev0, 42);
  68132   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68133   return __ret;
  68134 }
  68135 #endif
  68136 
  68137 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd32z_f64(float64x1_t __p0) {
  68138   float64x1_t __ret;
  68139   __ret = (float64x1_t) __builtin_neon_vrnd32z_f64((int8x8_t)__p0, 10);
  68140   return __ret;
  68141 }
  68142 #ifdef __LITTLE_ENDIAN__
  68143 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64xq_f32(float32x4_t __p0) {
  68144   float32x4_t __ret;
  68145   __ret = (float32x4_t) __builtin_neon_vrnd64xq_f32((int8x16_t)__p0, 41);
  68146   return __ret;
  68147 }
  68148 #else
  68149 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64xq_f32(float32x4_t __p0) {
  68150   float32x4_t __ret;
  68151   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68152   __ret = (float32x4_t) __builtin_neon_vrnd64xq_f32((int8x16_t)__rev0, 41);
  68153   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68154   return __ret;
  68155 }
  68156 #endif
  68157 
  68158 #ifdef __LITTLE_ENDIAN__
  68159 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64x_f32(float32x2_t __p0) {
  68160   float32x2_t __ret;
  68161   __ret = (float32x2_t) __builtin_neon_vrnd64x_f32((int8x8_t)__p0, 9);
  68162   return __ret;
  68163 }
  68164 #else
  68165 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64x_f32(float32x2_t __p0) {
  68166   float32x2_t __ret;
  68167   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68168   __ret = (float32x2_t) __builtin_neon_vrnd64x_f32((int8x8_t)__rev0, 9);
  68169   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68170   return __ret;
  68171 }
  68172 #endif
  68173 
  68174 #ifdef __LITTLE_ENDIAN__
  68175 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64xq_f64(float64x2_t __p0) {
  68176   float64x2_t __ret;
  68177   __ret = (float64x2_t) __builtin_neon_vrnd64xq_f64((int8x16_t)__p0, 42);
  68178   return __ret;
  68179 }
  68180 #else
  68181 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64xq_f64(float64x2_t __p0) {
  68182   float64x2_t __ret;
  68183   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68184   __ret = (float64x2_t) __builtin_neon_vrnd64xq_f64((int8x16_t)__rev0, 42);
  68185   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68186   return __ret;
  68187 }
  68188 #endif
  68189 
  68190 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd64x_f64(float64x1_t __p0) {
  68191   float64x1_t __ret;
  68192   __ret = (float64x1_t) __builtin_neon_vrnd64x_f64((int8x8_t)__p0, 10);
  68193   return __ret;
  68194 }
  68195 #ifdef __LITTLE_ENDIAN__
  68196 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64zq_f32(float32x4_t __p0) {
  68197   float32x4_t __ret;
  68198   __ret = (float32x4_t) __builtin_neon_vrnd64zq_f32((int8x16_t)__p0, 41);
  68199   return __ret;
  68200 }
  68201 #else
  68202 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64zq_f32(float32x4_t __p0) {
  68203   float32x4_t __ret;
  68204   float32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68205   __ret = (float32x4_t) __builtin_neon_vrnd64zq_f32((int8x16_t)__rev0, 41);
  68206   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68207   return __ret;
  68208 }
  68209 #endif
  68210 
  68211 #ifdef __LITTLE_ENDIAN__
  68212 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64z_f32(float32x2_t __p0) {
  68213   float32x2_t __ret;
  68214   __ret = (float32x2_t) __builtin_neon_vrnd64z_f32((int8x8_t)__p0, 9);
  68215   return __ret;
  68216 }
  68217 #else
  68218 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64z_f32(float32x2_t __p0) {
  68219   float32x2_t __ret;
  68220   float32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68221   __ret = (float32x2_t) __builtin_neon_vrnd64z_f32((int8x8_t)__rev0, 9);
  68222   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68223   return __ret;
  68224 }
  68225 #endif
  68226 
  68227 #ifdef __LITTLE_ENDIAN__
  68228 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64zq_f64(float64x2_t __p0) {
  68229   float64x2_t __ret;
  68230   __ret = (float64x2_t) __builtin_neon_vrnd64zq_f64((int8x16_t)__p0, 42);
  68231   return __ret;
  68232 }
  68233 #else
  68234 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64zq_f64(float64x2_t __p0) {
  68235   float64x2_t __ret;
  68236   float64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68237   __ret = (float64x2_t) __builtin_neon_vrnd64zq_f64((int8x16_t)__rev0, 42);
  68238   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68239   return __ret;
  68240 }
  68241 #endif
  68242 
  68243 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd64z_f64(float64x1_t __p0) {
  68244   float64x1_t __ret;
  68245   __ret = (float64x1_t) __builtin_neon_vrnd64z_f64((int8x8_t)__p0, 10);
  68246   return __ret;
  68247 }
  68248 #endif
  68249 #ifdef __LITTLE_ENDIAN__
  68250 #define vbfdotq_lane_f32(__p0_792, __p1_792, __p2_792, __p3_792) __extension__ ({ \
  68251   float32x4_t __ret_792; \
  68252   float32x4_t __s0_792 = __p0_792; \
  68253   bfloat16x8_t __s1_792 = __p1_792; \
  68254   bfloat16x4_t __s2_792 = __p2_792; \
  68255   __ret_792 = vbfdotq_f32(__s0_792, __s1_792, __builtin_bit_cast(bfloat16x8_t, splatq_lane_f32(__builtin_bit_cast(float32x2_t, __s2_792), __p3_792))); \
  68256   __ret_792; \
  68257 })
  68258 #else
  68259 #define vbfdotq_lane_f32(__p0_793, __p1_793, __p2_793, __p3_793) __extension__ ({ \
  68260   float32x4_t __ret_793; \
  68261   float32x4_t __s0_793 = __p0_793; \
  68262   bfloat16x8_t __s1_793 = __p1_793; \
  68263   bfloat16x4_t __s2_793 = __p2_793; \
  68264   float32x4_t __rev0_793;  __rev0_793 = __builtin_shufflevector(__s0_793, __s0_793, 3, 2, 1, 0); \
  68265   bfloat16x8_t __rev1_793;  __rev1_793 = __builtin_shufflevector(__s1_793, __s1_793, 7, 6, 5, 4, 3, 2, 1, 0); \
  68266   bfloat16x4_t __rev2_793;  __rev2_793 = __builtin_shufflevector(__s2_793, __s2_793, 3, 2, 1, 0); \
  68267   __ret_793 = __noswap_vbfdotq_f32(__rev0_793, __rev1_793, __builtin_bit_cast(bfloat16x8_t, __noswap_splatq_lane_f32(__builtin_bit_cast(float32x2_t, __rev2_793), __p3_793))); \
  68268   __ret_793 = __builtin_shufflevector(__ret_793, __ret_793, 3, 2, 1, 0); \
  68269   __ret_793; \
  68270 })
  68271 #endif
  68272 
  68273 #ifdef __LITTLE_ENDIAN__
  68274 #define vbfdot_lane_f32(__p0_794, __p1_794, __p2_794, __p3_794) __extension__ ({ \
  68275   float32x2_t __ret_794; \
  68276   float32x2_t __s0_794 = __p0_794; \
  68277   bfloat16x4_t __s1_794 = __p1_794; \
  68278   bfloat16x4_t __s2_794 = __p2_794; \
  68279   __ret_794 = vbfdot_f32(__s0_794, __s1_794, __builtin_bit_cast(bfloat16x4_t, splat_lane_f32(__builtin_bit_cast(float32x2_t, __s2_794), __p3_794))); \
  68280   __ret_794; \
  68281 })
  68282 #else
  68283 #define vbfdot_lane_f32(__p0_795, __p1_795, __p2_795, __p3_795) __extension__ ({ \
  68284   float32x2_t __ret_795; \
  68285   float32x2_t __s0_795 = __p0_795; \
  68286   bfloat16x4_t __s1_795 = __p1_795; \
  68287   bfloat16x4_t __s2_795 = __p2_795; \
  68288   float32x2_t __rev0_795;  __rev0_795 = __builtin_shufflevector(__s0_795, __s0_795, 1, 0); \
  68289   bfloat16x4_t __rev1_795;  __rev1_795 = __builtin_shufflevector(__s1_795, __s1_795, 3, 2, 1, 0); \
  68290   bfloat16x4_t __rev2_795;  __rev2_795 = __builtin_shufflevector(__s2_795, __s2_795, 3, 2, 1, 0); \
  68291   __ret_795 = __noswap_vbfdot_f32(__rev0_795, __rev1_795, __builtin_bit_cast(bfloat16x4_t, __noswap_splat_lane_f32(__builtin_bit_cast(float32x2_t, __rev2_795), __p3_795))); \
  68292   __ret_795 = __builtin_shufflevector(__ret_795, __ret_795, 1, 0); \
  68293   __ret_795; \
  68294 })
  68295 #endif
  68296 
  68297 #ifdef __LITTLE_ENDIAN__
  68298 #define vbfdotq_laneq_f32(__p0_796, __p1_796, __p2_796, __p3_796) __extension__ ({ \
  68299   float32x4_t __ret_796; \
  68300   float32x4_t __s0_796 = __p0_796; \
  68301   bfloat16x8_t __s1_796 = __p1_796; \
  68302   bfloat16x8_t __s2_796 = __p2_796; \
  68303   __ret_796 = vbfdotq_f32(__s0_796, __s1_796, __builtin_bit_cast(bfloat16x8_t, splatq_laneq_f32(__builtin_bit_cast(float32x4_t, __s2_796), __p3_796))); \
  68304   __ret_796; \
  68305 })
  68306 #else
  68307 #define vbfdotq_laneq_f32(__p0_797, __p1_797, __p2_797, __p3_797) __extension__ ({ \
  68308   float32x4_t __ret_797; \
  68309   float32x4_t __s0_797 = __p0_797; \
  68310   bfloat16x8_t __s1_797 = __p1_797; \
  68311   bfloat16x8_t __s2_797 = __p2_797; \
  68312   float32x4_t __rev0_797;  __rev0_797 = __builtin_shufflevector(__s0_797, __s0_797, 3, 2, 1, 0); \
  68313   bfloat16x8_t __rev1_797;  __rev1_797 = __builtin_shufflevector(__s1_797, __s1_797, 7, 6, 5, 4, 3, 2, 1, 0); \
  68314   bfloat16x8_t __rev2_797;  __rev2_797 = __builtin_shufflevector(__s2_797, __s2_797, 7, 6, 5, 4, 3, 2, 1, 0); \
  68315   __ret_797 = __noswap_vbfdotq_f32(__rev0_797, __rev1_797, __builtin_bit_cast(bfloat16x8_t, __noswap_splatq_laneq_f32(__builtin_bit_cast(float32x4_t, __rev2_797), __p3_797))); \
  68316   __ret_797 = __builtin_shufflevector(__ret_797, __ret_797, 3, 2, 1, 0); \
  68317   __ret_797; \
  68318 })
  68319 #endif
  68320 
  68321 #ifdef __LITTLE_ENDIAN__
  68322 #define vbfdot_laneq_f32(__p0_798, __p1_798, __p2_798, __p3_798) __extension__ ({ \
  68323   float32x2_t __ret_798; \
  68324   float32x2_t __s0_798 = __p0_798; \
  68325   bfloat16x4_t __s1_798 = __p1_798; \
  68326   bfloat16x8_t __s2_798 = __p2_798; \
  68327   __ret_798 = vbfdot_f32(__s0_798, __s1_798, __builtin_bit_cast(bfloat16x4_t, splat_laneq_f32(__builtin_bit_cast(float32x4_t, __s2_798), __p3_798))); \
  68328   __ret_798; \
  68329 })
  68330 #else
  68331 #define vbfdot_laneq_f32(__p0_799, __p1_799, __p2_799, __p3_799) __extension__ ({ \
  68332   float32x2_t __ret_799; \
  68333   float32x2_t __s0_799 = __p0_799; \
  68334   bfloat16x4_t __s1_799 = __p1_799; \
  68335   bfloat16x8_t __s2_799 = __p2_799; \
  68336   float32x2_t __rev0_799;  __rev0_799 = __builtin_shufflevector(__s0_799, __s0_799, 1, 0); \
  68337   bfloat16x4_t __rev1_799;  __rev1_799 = __builtin_shufflevector(__s1_799, __s1_799, 3, 2, 1, 0); \
  68338   bfloat16x8_t __rev2_799;  __rev2_799 = __builtin_shufflevector(__s2_799, __s2_799, 7, 6, 5, 4, 3, 2, 1, 0); \
  68339   __ret_799 = __noswap_vbfdot_f32(__rev0_799, __rev1_799, __builtin_bit_cast(bfloat16x4_t, __noswap_splat_laneq_f32(__builtin_bit_cast(float32x4_t, __rev2_799), __p3_799))); \
  68340   __ret_799 = __builtin_shufflevector(__ret_799, __ret_799, 1, 0); \
  68341   __ret_799; \
  68342 })
  68343 #endif
  68344 
  68345 #ifdef __LITTLE_ENDIAN__
  68346 #define vbfmlalbq_lane_f32(__p0_800, __p1_800, __p2_800, __p3_800) __extension__ ({ \
  68347   float32x4_t __ret_800; \
  68348   float32x4_t __s0_800 = __p0_800; \
  68349   bfloat16x8_t __s1_800 = __p1_800; \
  68350   bfloat16x4_t __s2_800 = __p2_800; \
  68351   __ret_800 = vbfmlalbq_f32(__s0_800, __s1_800, (bfloat16x8_t) {vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800)}); \
  68352   __ret_800; \
  68353 })
  68354 #else
  68355 #define vbfmlalbq_lane_f32(__p0_801, __p1_801, __p2_801, __p3_801) __extension__ ({ \
  68356   float32x4_t __ret_801; \
  68357   float32x4_t __s0_801 = __p0_801; \
  68358   bfloat16x8_t __s1_801 = __p1_801; \
  68359   bfloat16x4_t __s2_801 = __p2_801; \
  68360   float32x4_t __rev0_801;  __rev0_801 = __builtin_shufflevector(__s0_801, __s0_801, 3, 2, 1, 0); \
  68361   bfloat16x8_t __rev1_801;  __rev1_801 = __builtin_shufflevector(__s1_801, __s1_801, 7, 6, 5, 4, 3, 2, 1, 0); \
  68362   bfloat16x4_t __rev2_801;  __rev2_801 = __builtin_shufflevector(__s2_801, __s2_801, 3, 2, 1, 0); \
  68363   __ret_801 = __noswap_vbfmlalbq_f32(__rev0_801, __rev1_801, (bfloat16x8_t) {__noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801)}); \
  68364   __ret_801 = __builtin_shufflevector(__ret_801, __ret_801, 3, 2, 1, 0); \
  68365   __ret_801; \
  68366 })
  68367 #endif
  68368 
  68369 #ifdef __LITTLE_ENDIAN__
  68370 #define vbfmlalbq_laneq_f32(__p0_802, __p1_802, __p2_802, __p3_802) __extension__ ({ \
  68371   float32x4_t __ret_802; \
  68372   float32x4_t __s0_802 = __p0_802; \
  68373   bfloat16x8_t __s1_802 = __p1_802; \
  68374   bfloat16x8_t __s2_802 = __p2_802; \
  68375   __ret_802 = vbfmlalbq_f32(__s0_802, __s1_802, (bfloat16x8_t) {vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802)}); \
  68376   __ret_802; \
  68377 })
  68378 #else
  68379 #define vbfmlalbq_laneq_f32(__p0_803, __p1_803, __p2_803, __p3_803) __extension__ ({ \
  68380   float32x4_t __ret_803; \
  68381   float32x4_t __s0_803 = __p0_803; \
  68382   bfloat16x8_t __s1_803 = __p1_803; \
  68383   bfloat16x8_t __s2_803 = __p2_803; \
  68384   float32x4_t __rev0_803;  __rev0_803 = __builtin_shufflevector(__s0_803, __s0_803, 3, 2, 1, 0); \
  68385   bfloat16x8_t __rev1_803;  __rev1_803 = __builtin_shufflevector(__s1_803, __s1_803, 7, 6, 5, 4, 3, 2, 1, 0); \
  68386   bfloat16x8_t __rev2_803;  __rev2_803 = __builtin_shufflevector(__s2_803, __s2_803, 7, 6, 5, 4, 3, 2, 1, 0); \
  68387   __ret_803 = __noswap_vbfmlalbq_f32(__rev0_803, __rev1_803, (bfloat16x8_t) {__noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803)}); \
  68388   __ret_803 = __builtin_shufflevector(__ret_803, __ret_803, 3, 2, 1, 0); \
  68389   __ret_803; \
  68390 })
  68391 #endif
  68392 
  68393 #ifdef __LITTLE_ENDIAN__
  68394 #define vbfmlaltq_lane_f32(__p0_804, __p1_804, __p2_804, __p3_804) __extension__ ({ \
  68395   float32x4_t __ret_804; \
  68396   float32x4_t __s0_804 = __p0_804; \
  68397   bfloat16x8_t __s1_804 = __p1_804; \
  68398   bfloat16x4_t __s2_804 = __p2_804; \
  68399   __ret_804 = vbfmlaltq_f32(__s0_804, __s1_804, (bfloat16x8_t) {vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804)}); \
  68400   __ret_804; \
  68401 })
  68402 #else
  68403 #define vbfmlaltq_lane_f32(__p0_805, __p1_805, __p2_805, __p3_805) __extension__ ({ \
  68404   float32x4_t __ret_805; \
  68405   float32x4_t __s0_805 = __p0_805; \
  68406   bfloat16x8_t __s1_805 = __p1_805; \
  68407   bfloat16x4_t __s2_805 = __p2_805; \
  68408   float32x4_t __rev0_805;  __rev0_805 = __builtin_shufflevector(__s0_805, __s0_805, 3, 2, 1, 0); \
  68409   bfloat16x8_t __rev1_805;  __rev1_805 = __builtin_shufflevector(__s1_805, __s1_805, 7, 6, 5, 4, 3, 2, 1, 0); \
  68410   bfloat16x4_t __rev2_805;  __rev2_805 = __builtin_shufflevector(__s2_805, __s2_805, 3, 2, 1, 0); \
  68411   __ret_805 = __noswap_vbfmlaltq_f32(__rev0_805, __rev1_805, (bfloat16x8_t) {__noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805)}); \
  68412   __ret_805 = __builtin_shufflevector(__ret_805, __ret_805, 3, 2, 1, 0); \
  68413   __ret_805; \
  68414 })
  68415 #endif
  68416 
  68417 #ifdef __LITTLE_ENDIAN__
  68418 #define vbfmlaltq_laneq_f32(__p0_806, __p1_806, __p2_806, __p3_806) __extension__ ({ \
  68419   float32x4_t __ret_806; \
  68420   float32x4_t __s0_806 = __p0_806; \
  68421   bfloat16x8_t __s1_806 = __p1_806; \
  68422   bfloat16x8_t __s2_806 = __p2_806; \
  68423   __ret_806 = vbfmlaltq_f32(__s0_806, __s1_806, (bfloat16x8_t) {vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806)}); \
  68424   __ret_806; \
  68425 })
  68426 #else
  68427 #define vbfmlaltq_laneq_f32(__p0_807, __p1_807, __p2_807, __p3_807) __extension__ ({ \
  68428   float32x4_t __ret_807; \
  68429   float32x4_t __s0_807 = __p0_807; \
  68430   bfloat16x8_t __s1_807 = __p1_807; \
  68431   bfloat16x8_t __s2_807 = __p2_807; \
  68432   float32x4_t __rev0_807;  __rev0_807 = __builtin_shufflevector(__s0_807, __s0_807, 3, 2, 1, 0); \
  68433   bfloat16x8_t __rev1_807;  __rev1_807 = __builtin_shufflevector(__s1_807, __s1_807, 7, 6, 5, 4, 3, 2, 1, 0); \
  68434   bfloat16x8_t __rev2_807;  __rev2_807 = __builtin_shufflevector(__s2_807, __s2_807, 7, 6, 5, 4, 3, 2, 1, 0); \
  68435   __ret_807 = __noswap_vbfmlaltq_f32(__rev0_807, __rev1_807, (bfloat16x8_t) {__noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807)}); \
  68436   __ret_807 = __builtin_shufflevector(__ret_807, __ret_807, 3, 2, 1, 0); \
  68437   __ret_807; \
  68438 })
  68439 #endif
  68440 
  68441 #ifdef __LITTLE_ENDIAN__
  68442 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvt_f32_bf16(bfloat16x4_t __p0_808) {
  68443   float32x4_t __ret_808;
  68444   __ret_808 = __builtin_bit_cast(float32x4_t, vshll_n_u16(__builtin_bit_cast(uint16x4_t, __p0_808), 16));
  68445   return __ret_808;
  68446 }
  68447 #else
  68448 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvt_f32_bf16(bfloat16x4_t __p0_809) {
  68449   float32x4_t __ret_809;
  68450   bfloat16x4_t __rev0_809;  __rev0_809 = __builtin_shufflevector(__p0_809, __p0_809, 3, 2, 1, 0);
  68451   __ret_809 = __builtin_bit_cast(float32x4_t, __noswap_vshll_n_u16(__builtin_bit_cast(uint16x4_t, __rev0_809), 16));
  68452   __ret_809 = __builtin_shufflevector(__ret_809, __ret_809, 3, 2, 1, 0);
  68453   return __ret_809;
  68454 }
  68455 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vcvt_f32_bf16(bfloat16x4_t __p0_810) {
  68456   float32x4_t __ret_810;
  68457   __ret_810 = __builtin_bit_cast(float32x4_t, __noswap_vshll_n_u16(__builtin_bit_cast(uint16x4_t, __p0_810), 16));
  68458   return __ret_810;
  68459 }
  68460 #endif
  68461 
  68462 #ifdef __LITTLE_ENDIAN__
  68463 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_high_f32_bf16(bfloat16x8_t __p0) {
  68464   float32x4_t __ret;
  68465   __ret = vcvt_f32_bf16(vget_high_bf16(__p0));
  68466   return __ret;
  68467 }
  68468 #else
  68469 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_high_f32_bf16(bfloat16x8_t __p0) {
  68470   float32x4_t __ret;
  68471   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68472   __ret = __noswap_vcvt_f32_bf16(__noswap_vget_high_bf16(__rev0));
  68473   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68474   return __ret;
  68475 }
  68476 #endif
  68477 
  68478 #ifdef __LITTLE_ENDIAN__
  68479 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_low_f32_bf16(bfloat16x8_t __p0) {
  68480   float32x4_t __ret;
  68481   __ret = vcvt_f32_bf16(vget_low_bf16(__p0));
  68482   return __ret;
  68483 }
  68484 #else
  68485 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_low_f32_bf16(bfloat16x8_t __p0) {
  68486   float32x4_t __ret;
  68487   bfloat16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68488   __ret = __noswap_vcvt_f32_bf16(__noswap_vget_low_bf16(__rev0));
  68489   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68490   return __ret;
  68491 }
  68492 #endif
  68493 
  68494 #ifdef __LITTLE_ENDIAN__
  68495 #define vdotq_lane_u32(__p0_811, __p1_811, __p2_811, __p3_811) __extension__ ({ \
  68496   uint32x4_t __ret_811; \
  68497   uint32x4_t __s0_811 = __p0_811; \
  68498   uint8x16_t __s1_811 = __p1_811; \
  68499   uint8x8_t __s2_811 = __p2_811; \
  68500   __ret_811 = vdotq_u32(__s0_811, __s1_811, __builtin_bit_cast(uint8x16_t, splatq_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_811), __p3_811))); \
  68501   __ret_811; \
  68502 })
  68503 #else
  68504 #define vdotq_lane_u32(__p0_812, __p1_812, __p2_812, __p3_812) __extension__ ({ \
  68505   uint32x4_t __ret_812; \
  68506   uint32x4_t __s0_812 = __p0_812; \
  68507   uint8x16_t __s1_812 = __p1_812; \
  68508   uint8x8_t __s2_812 = __p2_812; \
  68509   uint32x4_t __rev0_812;  __rev0_812 = __builtin_shufflevector(__s0_812, __s0_812, 3, 2, 1, 0); \
  68510   uint8x16_t __rev1_812;  __rev1_812 = __builtin_shufflevector(__s1_812, __s1_812, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  68511   uint8x8_t __rev2_812;  __rev2_812 = __builtin_shufflevector(__s2_812, __s2_812, 7, 6, 5, 4, 3, 2, 1, 0); \
  68512   __ret_812 = __noswap_vdotq_u32(__rev0_812, __rev1_812, __builtin_bit_cast(uint8x16_t, __noswap_splatq_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_812), __p3_812))); \
  68513   __ret_812 = __builtin_shufflevector(__ret_812, __ret_812, 3, 2, 1, 0); \
  68514   __ret_812; \
  68515 })
  68516 #endif
  68517 
  68518 #ifdef __LITTLE_ENDIAN__
  68519 #define vdotq_lane_s32(__p0_813, __p1_813, __p2_813, __p3_813) __extension__ ({ \
  68520   int32x4_t __ret_813; \
  68521   int32x4_t __s0_813 = __p0_813; \
  68522   int8x16_t __s1_813 = __p1_813; \
  68523   int8x8_t __s2_813 = __p2_813; \
  68524   __ret_813 = vdotq_s32(__s0_813, __s1_813, __builtin_bit_cast(int8x16_t, splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_813), __p3_813))); \
  68525   __ret_813; \
  68526 })
  68527 #else
  68528 #define vdotq_lane_s32(__p0_814, __p1_814, __p2_814, __p3_814) __extension__ ({ \
  68529   int32x4_t __ret_814; \
  68530   int32x4_t __s0_814 = __p0_814; \
  68531   int8x16_t __s1_814 = __p1_814; \
  68532   int8x8_t __s2_814 = __p2_814; \
  68533   int32x4_t __rev0_814;  __rev0_814 = __builtin_shufflevector(__s0_814, __s0_814, 3, 2, 1, 0); \
  68534   int8x16_t __rev1_814;  __rev1_814 = __builtin_shufflevector(__s1_814, __s1_814, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  68535   int8x8_t __rev2_814;  __rev2_814 = __builtin_shufflevector(__s2_814, __s2_814, 7, 6, 5, 4, 3, 2, 1, 0); \
  68536   __ret_814 = __noswap_vdotq_s32(__rev0_814, __rev1_814, __builtin_bit_cast(int8x16_t, __noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_814), __p3_814))); \
  68537   __ret_814 = __builtin_shufflevector(__ret_814, __ret_814, 3, 2, 1, 0); \
  68538   __ret_814; \
  68539 })
  68540 #endif
  68541 
  68542 #ifdef __LITTLE_ENDIAN__
        /* vdot_lane_u32(acc, a, b, lane) -- little-endian definition.
         * Bit-casts b (uint8x8_t) to uint32x2_t, hands it with `lane` to
         * splat_lane_u32, bit-casts that result back to uint8x8_t and uses it as
         * the third operand of vdot_u32(acc, a, ...). Yields a uint32x2_t. */
  68543 #define vdot_lane_u32(__p0_815, __p1_815, __p2_815, __p3_815) __extension__ ({ \
  68544   uint32x2_t __ret_815; \
  68545   uint32x2_t __s0_815 = __p0_815; \
  68546   uint8x8_t __s1_815 = __p1_815; \
  68547   uint8x8_t __s2_815 = __p2_815; \
  68548   __ret_815 = vdot_u32(__s0_815, __s1_815, __builtin_bit_cast(uint8x8_t, splat_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_815), __p3_815))); \
  68549   __ret_815; \
  68550 })
  68551 #else
        /* Big-endian definition: all three vector operands are lane-reversed,
         * the __noswap_ helpers are applied to the reversed copies, and the
         * uint32x2_t result is lane-reversed again before it is yielded. */
  68552 #define vdot_lane_u32(__p0_816, __p1_816, __p2_816, __p3_816) __extension__ ({ \
  68553   uint32x2_t __ret_816; \
  68554   uint32x2_t __s0_816 = __p0_816; \
  68555   uint8x8_t __s1_816 = __p1_816; \
  68556   uint8x8_t __s2_816 = __p2_816; \
  68557   uint32x2_t __rev0_816;  __rev0_816 = __builtin_shufflevector(__s0_816, __s0_816, 1, 0); \
  68558   uint8x8_t __rev1_816;  __rev1_816 = __builtin_shufflevector(__s1_816, __s1_816, 7, 6, 5, 4, 3, 2, 1, 0); \
  68559   uint8x8_t __rev2_816;  __rev2_816 = __builtin_shufflevector(__s2_816, __s2_816, 7, 6, 5, 4, 3, 2, 1, 0); \
  68560   __ret_816 = __noswap_vdot_u32(__rev0_816, __rev1_816, __builtin_bit_cast(uint8x8_t, __noswap_splat_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_816), __p3_816))); \
  68561   __ret_816 = __builtin_shufflevector(__ret_816, __ret_816, 1, 0); \
  68562   __ret_816; \
  68563 })
  68564 #endif
  68565 
  68566 #ifdef __LITTLE_ENDIAN__
        /* vdot_lane_s32(acc, a, b, lane) -- little-endian definition.
         * Bit-casts b (int8x8_t) to int32x2_t, hands it with `lane` to
         * splat_lane_s32, bit-casts that result back to int8x8_t and uses it as
         * the third operand of vdot_s32(acc, a, ...). Yields an int32x2_t. */
  68567 #define vdot_lane_s32(__p0_817, __p1_817, __p2_817, __p3_817) __extension__ ({ \
  68568   int32x2_t __ret_817; \
  68569   int32x2_t __s0_817 = __p0_817; \
  68570   int8x8_t __s1_817 = __p1_817; \
  68571   int8x8_t __s2_817 = __p2_817; \
  68572   __ret_817 = vdot_s32(__s0_817, __s1_817, __builtin_bit_cast(int8x8_t, splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_817), __p3_817))); \
  68573   __ret_817; \
  68574 })
  68575 #else
        /* Big-endian definition: all three vector operands are lane-reversed,
         * the __noswap_ helpers are applied to the reversed copies, and the
         * int32x2_t result is lane-reversed again before it is yielded. */
  68576 #define vdot_lane_s32(__p0_818, __p1_818, __p2_818, __p3_818) __extension__ ({ \
  68577   int32x2_t __ret_818; \
  68578   int32x2_t __s0_818 = __p0_818; \
  68579   int8x8_t __s1_818 = __p1_818; \
  68580   int8x8_t __s2_818 = __p2_818; \
  68581   int32x2_t __rev0_818;  __rev0_818 = __builtin_shufflevector(__s0_818, __s0_818, 1, 0); \
  68582   int8x8_t __rev1_818;  __rev1_818 = __builtin_shufflevector(__s1_818, __s1_818, 7, 6, 5, 4, 3, 2, 1, 0); \
  68583   int8x8_t __rev2_818;  __rev2_818 = __builtin_shufflevector(__s2_818, __s2_818, 7, 6, 5, 4, 3, 2, 1, 0); \
  68584   __ret_818 = __noswap_vdot_s32(__rev0_818, __rev1_818, __builtin_bit_cast(int8x8_t, __noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_818), __p3_818))); \
  68585   __ret_818 = __builtin_shufflevector(__ret_818, __ret_818, 1, 0); \
  68586   __ret_818; \
  68587 })
  68588 #endif
  68589 
  68590 #ifdef __LITTLE_ENDIAN__
        /* vmulq_lane_f16(a, b, lane) -- little-endian definition.
         * Multiplies a (float16x8_t) by the value of splatq_lane_f16(b, lane),
         * where b is a float16x4_t. Yields a float16x8_t. */
  68591 #define vmulq_lane_f16(__p0_819, __p1_819, __p2_819) __extension__ ({ \
  68592   float16x8_t __ret_819; \
  68593   float16x8_t __s0_819 = __p0_819; \
  68594   float16x4_t __s1_819 = __p1_819; \
  68595   __ret_819 = __s0_819 * splatq_lane_f16(__s1_819, __p2_819); \
  68596   __ret_819; \
  68597 })
  68598 #else
        /* Big-endian definition: a and b are lane-reversed, the product is
         * formed with __noswap_splatq_lane_f16 on the reversed b, and the
         * float16x8_t result is lane-reversed again before it is yielded. */
  68599 #define vmulq_lane_f16(__p0_820, __p1_820, __p2_820) __extension__ ({ \
  68600   float16x8_t __ret_820; \
  68601   float16x8_t __s0_820 = __p0_820; \
  68602   float16x4_t __s1_820 = __p1_820; \
  68603   float16x8_t __rev0_820;  __rev0_820 = __builtin_shufflevector(__s0_820, __s0_820, 7, 6, 5, 4, 3, 2, 1, 0); \
  68604   float16x4_t __rev1_820;  __rev1_820 = __builtin_shufflevector(__s1_820, __s1_820, 3, 2, 1, 0); \
  68605   __ret_820 = __rev0_820 * __noswap_splatq_lane_f16(__rev1_820, __p2_820); \
  68606   __ret_820 = __builtin_shufflevector(__ret_820, __ret_820, 7, 6, 5, 4, 3, 2, 1, 0); \
  68607   __ret_820; \
  68608 })
  68609 #endif
  68610 
  68611 #ifdef __LITTLE_ENDIAN__
        /* vmul_lane_f16(a, b, lane) -- little-endian definition.
         * Multiplies a (float16x4_t) by the value of splat_lane_f16(b, lane),
         * where b is also a float16x4_t. Yields a float16x4_t. */
  68612 #define vmul_lane_f16(__p0_821, __p1_821, __p2_821) __extension__ ({ \
  68613   float16x4_t __ret_821; \
  68614   float16x4_t __s0_821 = __p0_821; \
  68615   float16x4_t __s1_821 = __p1_821; \
  68616   __ret_821 = __s0_821 * splat_lane_f16(__s1_821, __p2_821); \
  68617   __ret_821; \
  68618 })
  68619 #else
        /* Big-endian definition: a and b are lane-reversed, the product is
         * formed with __noswap_splat_lane_f16 on the reversed b, and the
         * float16x4_t result is lane-reversed again before it is yielded. */
  68620 #define vmul_lane_f16(__p0_822, __p1_822, __p2_822) __extension__ ({ \
  68621   float16x4_t __ret_822; \
  68622   float16x4_t __s0_822 = __p0_822; \
  68623   float16x4_t __s1_822 = __p1_822; \
  68624   float16x4_t __rev0_822;  __rev0_822 = __builtin_shufflevector(__s0_822, __s0_822, 3, 2, 1, 0); \
  68625   float16x4_t __rev1_822;  __rev1_822 = __builtin_shufflevector(__s1_822, __s1_822, 3, 2, 1, 0); \
  68626   __ret_822 = __rev0_822 * __noswap_splat_lane_f16(__rev1_822, __p2_822); \
  68627   __ret_822 = __builtin_shufflevector(__ret_822, __ret_822, 3, 2, 1, 0); \
  68628   __ret_822; \
  68629 })
  68630 #endif
  68631 
  68632 #ifdef __LITTLE_ENDIAN__
        /* vsudotq_lane_s32(acc, a, b, lane) -- little-endian definition.
         * Implemented on top of vusdotq_s32 with the operands swapped: b
         * (uint8x8_t) is bit-cast to int32x2_t, passed with `lane` to
         * splatq_lane_s32, cast to uint8x16_t and given as the SECOND operand,
         * while a (int8x16_t) is given as the third. Yields an int32x4_t. */
  68633 #define vsudotq_lane_s32(__p0_823, __p1_823, __p2_823, __p3_823) __extension__ ({ \
  68634   int32x4_t __ret_823; \
  68635   int32x4_t __s0_823 = __p0_823; \
  68636   int8x16_t __s1_823 = __p1_823; \
  68637   uint8x8_t __s2_823 = __p2_823; \
  68638   __ret_823 = vusdotq_s32(__s0_823, (uint8x16_t)(splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_823), __p3_823)), __s1_823); \
  68639   __ret_823; \
  68640 })
  68641 #else
        /* Big-endian definition: acc, a and b are lane-reversed, the same
         * operand-swapped call is made through the __noswap_ helpers, and the
         * int32x4_t result is lane-reversed again before it is yielded. */
  68642 #define vsudotq_lane_s32(__p0_824, __p1_824, __p2_824, __p3_824) __extension__ ({ \
  68643   int32x4_t __ret_824; \
  68644   int32x4_t __s0_824 = __p0_824; \
  68645   int8x16_t __s1_824 = __p1_824; \
  68646   uint8x8_t __s2_824 = __p2_824; \
  68647   int32x4_t __rev0_824;  __rev0_824 = __builtin_shufflevector(__s0_824, __s0_824, 3, 2, 1, 0); \
  68648   int8x16_t __rev1_824;  __rev1_824 = __builtin_shufflevector(__s1_824, __s1_824, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  68649   uint8x8_t __rev2_824;  __rev2_824 = __builtin_shufflevector(__s2_824, __s2_824, 7, 6, 5, 4, 3, 2, 1, 0); \
  68650   __ret_824 = __noswap_vusdotq_s32(__rev0_824, (uint8x16_t)(__noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_824), __p3_824)), __rev1_824); \
  68651   __ret_824 = __builtin_shufflevector(__ret_824, __ret_824, 3, 2, 1, 0); \
  68652   __ret_824; \
  68653 })
  68654 #endif
  68655 
  68656 #ifdef __LITTLE_ENDIAN__
        /* vsudot_lane_s32(acc, a, b, lane) -- little-endian definition.
         * Implemented on top of vusdot_s32 with the operands swapped: b
         * (uint8x8_t) is bit-cast to int32x2_t, passed with `lane` to
         * splat_lane_s32, cast to uint8x8_t and given as the SECOND operand,
         * while a (int8x8_t) is given as the third. Yields an int32x2_t. */
  68657 #define vsudot_lane_s32(__p0_825, __p1_825, __p2_825, __p3_825) __extension__ ({ \
  68658   int32x2_t __ret_825; \
  68659   int32x2_t __s0_825 = __p0_825; \
  68660   int8x8_t __s1_825 = __p1_825; \
  68661   uint8x8_t __s2_825 = __p2_825; \
  68662   __ret_825 = vusdot_s32(__s0_825, (uint8x8_t)(splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_825), __p3_825)), __s1_825); \
  68663   __ret_825; \
  68664 })
  68665 #else
        /* Big-endian definition: acc, a and b are lane-reversed, the same
         * operand-swapped call is made through the __noswap_ helpers, and the
         * int32x2_t result is lane-reversed again before it is yielded. */
  68666 #define vsudot_lane_s32(__p0_826, __p1_826, __p2_826, __p3_826) __extension__ ({ \
  68667   int32x2_t __ret_826; \
  68668   int32x2_t __s0_826 = __p0_826; \
  68669   int8x8_t __s1_826 = __p1_826; \
  68670   uint8x8_t __s2_826 = __p2_826; \
  68671   int32x2_t __rev0_826;  __rev0_826 = __builtin_shufflevector(__s0_826, __s0_826, 1, 0); \
  68672   int8x8_t __rev1_826;  __rev1_826 = __builtin_shufflevector(__s1_826, __s1_826, 7, 6, 5, 4, 3, 2, 1, 0); \
  68673   uint8x8_t __rev2_826;  __rev2_826 = __builtin_shufflevector(__s2_826, __s2_826, 7, 6, 5, 4, 3, 2, 1, 0); \
  68674   __ret_826 = __noswap_vusdot_s32(__rev0_826, (uint8x8_t)(__noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_826), __p3_826)), __rev1_826); \
  68675   __ret_826 = __builtin_shufflevector(__ret_826, __ret_826, 1, 0); \
  68676   __ret_826; \
  68677 })
  68678 #endif
  68679 
  68680 #ifdef __LITTLE_ENDIAN__
        /* vusdotq_lane_s32(acc, a, b, lane) -- little-endian definition.
         * Bit-casts b (int8x8_t) to int32x2_t, passes it with `lane` to
         * splatq_lane_s32, casts that result to int8x16_t and uses it as the
         * third operand of vusdotq_s32(acc, a, ...), where a is a uint8x16_t.
         * Yields an int32x4_t. */
  68681 #define vusdotq_lane_s32(__p0_827, __p1_827, __p2_827, __p3_827) __extension__ ({ \
  68682   int32x4_t __ret_827; \
  68683   int32x4_t __s0_827 = __p0_827; \
  68684   uint8x16_t __s1_827 = __p1_827; \
  68685   int8x8_t __s2_827 = __p2_827; \
  68686   __ret_827 = vusdotq_s32(__s0_827, __s1_827, (int8x16_t)(splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_827), __p3_827))); \
  68687   __ret_827; \
  68688 })
  68689 #else
        /* Big-endian definition: acc, a and b are lane-reversed, the call is
         * made through the __noswap_ helpers on the reversed copies, and the
         * int32x4_t result is lane-reversed again before it is yielded. */
  68690 #define vusdotq_lane_s32(__p0_828, __p1_828, __p2_828, __p3_828) __extension__ ({ \
  68691   int32x4_t __ret_828; \
  68692   int32x4_t __s0_828 = __p0_828; \
  68693   uint8x16_t __s1_828 = __p1_828; \
  68694   int8x8_t __s2_828 = __p2_828; \
  68695   int32x4_t __rev0_828;  __rev0_828 = __builtin_shufflevector(__s0_828, __s0_828, 3, 2, 1, 0); \
  68696   uint8x16_t __rev1_828;  __rev1_828 = __builtin_shufflevector(__s1_828, __s1_828, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  68697   int8x8_t __rev2_828;  __rev2_828 = __builtin_shufflevector(__s2_828, __s2_828, 7, 6, 5, 4, 3, 2, 1, 0); \
  68698   __ret_828 = __noswap_vusdotq_s32(__rev0_828, __rev1_828, (int8x16_t)(__noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_828), __p3_828))); \
  68699   __ret_828 = __builtin_shufflevector(__ret_828, __ret_828, 3, 2, 1, 0); \
  68700   __ret_828; \
  68701 })
  68702 #endif
  68703 
  68704 #ifdef __LITTLE_ENDIAN__
        /* vusdot_lane_s32(acc, a, b, lane) -- little-endian definition.
         * Bit-casts b (int8x8_t) to int32x2_t, passes it with `lane` to
         * splat_lane_s32, casts that result to int8x8_t and uses it as the
         * third operand of vusdot_s32(acc, a, ...), where a is a uint8x8_t.
         * Yields an int32x2_t. */
  68705 #define vusdot_lane_s32(__p0_829, __p1_829, __p2_829, __p3_829) __extension__ ({ \
  68706   int32x2_t __ret_829; \
  68707   int32x2_t __s0_829 = __p0_829; \
  68708   uint8x8_t __s1_829 = __p1_829; \
  68709   int8x8_t __s2_829 = __p2_829; \
  68710   __ret_829 = vusdot_s32(__s0_829, __s1_829, (int8x8_t)(splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_829), __p3_829))); \
  68711   __ret_829; \
  68712 })
  68713 #else
        /* Big-endian definition: acc, a and b are lane-reversed, the call is
         * made through the __noswap_ helpers on the reversed copies, and the
         * int32x2_t result is lane-reversed again before it is yielded. */
  68714 #define vusdot_lane_s32(__p0_830, __p1_830, __p2_830, __p3_830) __extension__ ({ \
  68715   int32x2_t __ret_830; \
  68716   int32x2_t __s0_830 = __p0_830; \
  68717   uint8x8_t __s1_830 = __p1_830; \
  68718   int8x8_t __s2_830 = __p2_830; \
  68719   int32x2_t __rev0_830;  __rev0_830 = __builtin_shufflevector(__s0_830, __s0_830, 1, 0); \
  68720   uint8x8_t __rev1_830;  __rev1_830 = __builtin_shufflevector(__s1_830, __s1_830, 7, 6, 5, 4, 3, 2, 1, 0); \
  68721   int8x8_t __rev2_830;  __rev2_830 = __builtin_shufflevector(__s2_830, __s2_830, 7, 6, 5, 4, 3, 2, 1, 0); \
  68722   __ret_830 = __noswap_vusdot_s32(__rev0_830, __rev1_830, (int8x8_t)(__noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_830), __p3_830))); \
  68723   __ret_830 = __builtin_shufflevector(__ret_830, __ret_830, 1, 0); \
  68724   __ret_830; \
  68725 })
  68726 #endif
  68727 
  68728 #ifdef __LITTLE_ENDIAN__
        /* vabaq_u8: returns __p0 + vabdq_u8(__p1, __p2) as a uint8x16_t. */
  68729 __ai __attribute__((target("neon"))) uint8x16_t vabaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  68730   uint8x16_t __ret;
  68731   __ret = __p0 + vabdq_u8(__p1, __p2);
  68732   return __ret;
  68733 }
  68734 #else
        /* Big-endian vabaq_u8: reverses the 16 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_u8(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68735 __ai __attribute__((target("neon"))) uint8x16_t vabaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  68736   uint8x16_t __ret;
  68737   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68738   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68739   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68740   __ret = __rev0 + __noswap_vabdq_u8(__rev1, __rev2);
  68741   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68742   return __ret;
  68743 }
  68744 #endif
  68745 
  68746 #ifdef __LITTLE_ENDIAN__
        /* vabaq_u32: returns __p0 + vabdq_u32(__p1, __p2) as a uint32x4_t. */
  68747 __ai __attribute__((target("neon"))) uint32x4_t vabaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  68748   uint32x4_t __ret;
  68749   __ret = __p0 + vabdq_u32(__p1, __p2);
  68750   return __ret;
  68751 }
  68752 #else
        /* Big-endian vabaq_u32: reverses the 4 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_u32(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68753 __ai __attribute__((target("neon"))) uint32x4_t vabaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  68754   uint32x4_t __ret;
  68755   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68756   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  68757   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  68758   __ret = __rev0 + __noswap_vabdq_u32(__rev1, __rev2);
  68759   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68760   return __ret;
  68761 }
  68762 #endif
  68763 
  68764 #ifdef __LITTLE_ENDIAN__
        /* vabaq_u16: returns __p0 + vabdq_u16(__p1, __p2) as a uint16x8_t. */
  68765 __ai __attribute__((target("neon"))) uint16x8_t vabaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  68766   uint16x8_t __ret;
  68767   __ret = __p0 + vabdq_u16(__p1, __p2);
  68768   return __ret;
  68769 }
  68770 #else
        /* Big-endian vabaq_u16: reverses the 8 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_u16(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68771 __ai __attribute__((target("neon"))) uint16x8_t vabaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  68772   uint16x8_t __ret;
  68773   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68774   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  68775   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  68776   __ret = __rev0 + __noswap_vabdq_u16(__rev1, __rev2);
  68777   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  68778   return __ret;
  68779 }
  68780 #endif
  68781 
  68782 #ifdef __LITTLE_ENDIAN__
        /* vabaq_s8: returns __p0 + vabdq_s8(__p1, __p2) as an int8x16_t. */
  68783 __ai __attribute__((target("neon"))) int8x16_t vabaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  68784   int8x16_t __ret;
  68785   __ret = __p0 + vabdq_s8(__p1, __p2);
  68786   return __ret;
  68787 }
  68788 #else
        /* Big-endian vabaq_s8: reverses the 16 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_s8(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68789 __ai __attribute__((target("neon"))) int8x16_t vabaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) {
  68790   int8x16_t __ret;
  68791   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68792   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68793   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68794   __ret = __rev0 + __noswap_vabdq_s8(__rev1, __rev2);
  68795   __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  68796   return __ret;
  68797 }
  68798 #endif
  68799 
  68800 #ifdef __LITTLE_ENDIAN__
        /* vabaq_s32: returns __p0 + vabdq_s32(__p1, __p2) as an int32x4_t. */
  68801 __ai __attribute__((target("neon"))) int32x4_t vabaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  68802   int32x4_t __ret;
  68803   __ret = __p0 + vabdq_s32(__p1, __p2);
  68804   return __ret;
  68805 }
  68806 #else
        /* Big-endian vabaq_s32: reverses the 4 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_s32(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68807 __ai __attribute__((target("neon"))) int32x4_t vabaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) {
  68808   int32x4_t __ret;
  68809   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68810   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  68811   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  68812   __ret = __rev0 + __noswap_vabdq_s32(__rev1, __rev2);
  68813   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68814   return __ret;
  68815 }
  68816 #endif
  68817 
  68818 #ifdef __LITTLE_ENDIAN__
        /* vabaq_s16: returns __p0 + vabdq_s16(__p1, __p2) as an int16x8_t. */
  68819 __ai __attribute__((target("neon"))) int16x8_t vabaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  68820   int16x8_t __ret;
  68821   __ret = __p0 + vabdq_s16(__p1, __p2);
  68822   return __ret;
  68823 }
  68824 #else
        /* Big-endian vabaq_s16: reverses the 8 lanes of each operand, computes
         * __rev0 + __noswap_vabdq_s16(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68825 __ai __attribute__((target("neon"))) int16x8_t vabaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) {
  68826   int16x8_t __ret;
  68827   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68828   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  68829   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  68830   __ret = __rev0 + __noswap_vabdq_s16(__rev1, __rev2);
  68831   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  68832   return __ret;
  68833 }
  68834 #endif
  68835 
  68836 #ifdef __LITTLE_ENDIAN__
        /* vaba_u8: returns __p0 + vabd_u8(__p1, __p2) as a uint8x8_t. */
  68837 __ai __attribute__((target("neon"))) uint8x8_t vaba_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  68838   uint8x8_t __ret;
  68839   __ret = __p0 + vabd_u8(__p1, __p2);
  68840   return __ret;
  68841 }
  68842 #else
        /* Big-endian vaba_u8: reverses the 8 lanes of each operand, computes
         * __rev0 + __noswap_vabd_u8(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68843 __ai __attribute__((target("neon"))) uint8x8_t vaba_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  68844   uint8x8_t __ret;
  68845   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68846   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  68847   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  68848   __ret = __rev0 + __noswap_vabd_u8(__rev1, __rev2);
  68849   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  68850   return __ret;
  68851 }
  68852 #endif
  68853 
  68854 #ifdef __LITTLE_ENDIAN__
        /* vaba_u32: returns __p0 + vabd_u32(__p1, __p2) as a uint32x2_t. */
  68855 __ai __attribute__((target("neon"))) uint32x2_t vaba_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  68856   uint32x2_t __ret;
  68857   __ret = __p0 + vabd_u32(__p1, __p2);
  68858   return __ret;
  68859 }
  68860 #else
        /* Big-endian vaba_u32: swaps the 2 lanes of each operand, computes
         * __rev0 + __noswap_vabd_u32(__rev1, __rev2), then swaps the lanes of
         * the sum back before returning it. */
  68861 __ai __attribute__((target("neon"))) uint32x2_t vaba_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  68862   uint32x2_t __ret;
  68863   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68864   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  68865   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  68866   __ret = __rev0 + __noswap_vabd_u32(__rev1, __rev2);
  68867   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68868   return __ret;
  68869 }
  68870 #endif
  68871 
  68872 #ifdef __LITTLE_ENDIAN__
        /* vaba_u16: returns __p0 + vabd_u16(__p1, __p2) as a uint16x4_t. */
  68873 __ai __attribute__((target("neon"))) uint16x4_t vaba_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  68874   uint16x4_t __ret;
  68875   __ret = __p0 + vabd_u16(__p1, __p2);
  68876   return __ret;
  68877 }
  68878 #else
        /* Big-endian vaba_u16: reverses the 4 lanes of each operand, computes
         * __rev0 + __noswap_vabd_u16(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68879 __ai __attribute__((target("neon"))) uint16x4_t vaba_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  68880   uint16x4_t __ret;
  68881   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68882   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  68883   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  68884   __ret = __rev0 + __noswap_vabd_u16(__rev1, __rev2);
  68885   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68886   return __ret;
  68887 }
  68888 #endif
  68889 
  68890 #ifdef __LITTLE_ENDIAN__
        /* vaba_s8: returns __p0 + vabd_s8(__p1, __p2) as an int8x8_t. */
  68891 __ai __attribute__((target("neon"))) int8x8_t vaba_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  68892   int8x8_t __ret;
  68893   __ret = __p0 + vabd_s8(__p1, __p2);
  68894   return __ret;
  68895 }
  68896 #else
        /* Big-endian vaba_s8: reverses the 8 lanes of each operand, computes
         * __rev0 + __noswap_vabd_s8(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68897 __ai __attribute__((target("neon"))) int8x8_t vaba_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  68898   int8x8_t __ret;
  68899   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68900   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  68901   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  68902   __ret = __rev0 + __noswap_vabd_s8(__rev1, __rev2);
  68903   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  68904   return __ret;
  68905 }
  68906 #endif
  68907 
  68908 #ifdef __LITTLE_ENDIAN__
        /* vaba_s32: returns __p0 + vabd_s32(__p1, __p2) as an int32x2_t. */
  68909 __ai __attribute__((target("neon"))) int32x2_t vaba_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  68910   int32x2_t __ret;
  68911   __ret = __p0 + vabd_s32(__p1, __p2);
  68912   return __ret;
  68913 }
  68914 #else
        /* Big-endian vaba_s32: swaps the 2 lanes of each operand, computes
         * __rev0 + __noswap_vabd_s32(__rev1, __rev2), then swaps the lanes of
         * the sum back before returning it. */
  68915 __ai __attribute__((target("neon"))) int32x2_t vaba_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  68916   int32x2_t __ret;
  68917   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68918   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  68919   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  68920   __ret = __rev0 + __noswap_vabd_s32(__rev1, __rev2);
  68921   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68922   return __ret;
  68923 }
  68924 #endif
  68925 
  68926 #ifdef __LITTLE_ENDIAN__
        /* vaba_s16: returns __p0 + vabd_s16(__p1, __p2) as an int16x4_t. */
  68927 __ai __attribute__((target("neon"))) int16x4_t vaba_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  68928   int16x4_t __ret;
  68929   __ret = __p0 + vabd_s16(__p1, __p2);
  68930   return __ret;
  68931 }
  68932 #else
        /* Big-endian vaba_s16: reverses the 4 lanes of each operand, computes
         * __rev0 + __noswap_vabd_s16(__rev1, __rev2), then reverses the lanes of
         * the sum before returning it. */
  68933 __ai __attribute__((target("neon"))) int16x4_t vaba_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  68934   int16x4_t __ret;
  68935   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68936   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  68937   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  68938   __ret = __rev0 + __noswap_vabd_s16(__rev1, __rev2);
  68939   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  68940   return __ret;
  68941 }
  68942 #endif
  68943 
  68944 #ifdef __LITTLE_ENDIAN__
        /* vabdl_u8: passes vabd_u8(__p0, __p1) through vmovl_u8 and returns the
         * resulting uint16x8_t. */
  68945 __ai __attribute__((target("neon"))) uint16x8_t vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  68946   uint16x8_t __ret;
  68947   __ret = (uint16x8_t)(vmovl_u8((uint8x8_t)(vabd_u8(__p0, __p1))));
  68948   return __ret;
  68949 }
  68950 #else
        /* Big-endian vabdl_u8: reverses the 8 lanes of both operands, applies
         * the __noswap_ forms of vabd_u8 and vmovl_u8, then reverses the lanes
         * of the uint16x8_t result before returning it. */
  68951 __ai __attribute__((target("neon"))) uint16x8_t vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  68952   uint16x8_t __ret;
  68953   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  68954   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  68955   __ret = (uint16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_u8(__rev0, __rev1))));
  68956   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  68957   return __ret;
  68958 }
        /* __noswap_vabdl_u8: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  68959 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  68960   uint16x8_t __ret;
  68961   __ret = (uint16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_u8(__p0, __p1))));
  68962   return __ret;
  68963 }
  68964 #endif
  68965 
  68966 #ifdef __LITTLE_ENDIAN__
        /* vabdl_u32: passes vabd_u32(__p0, __p1) through vmovl_u32 and returns
         * the resulting uint64x2_t. */
  68967 __ai __attribute__((target("neon"))) uint64x2_t vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  68968   uint64x2_t __ret;
  68969   __ret = (uint64x2_t)(vmovl_u32((uint32x2_t)(vabd_u32(__p0, __p1))));
  68970   return __ret;
  68971 }
  68972 #else
        /* Big-endian vabdl_u32: swaps the 2 lanes of both operands, applies the
         * __noswap_ forms of vabd_u32 and vmovl_u32, then swaps the lanes of the
         * uint64x2_t result back before returning it. */
  68973 __ai __attribute__((target("neon"))) uint64x2_t vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  68974   uint64x2_t __ret;
  68975   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  68976   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  68977   __ret = (uint64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_u32(__rev0, __rev1))));
  68978   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  68979   return __ret;
  68980 }
        /* __noswap_vabdl_u32: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  68981 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  68982   uint64x2_t __ret;
  68983   __ret = (uint64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_u32(__p0, __p1))));
  68984   return __ret;
  68985 }
  68986 #endif
  68987 
  68988 #ifdef __LITTLE_ENDIAN__
        /* vabdl_u16: passes vabd_u16(__p0, __p1) through vmovl_u16 and returns
         * the resulting uint32x4_t. */
  68989 __ai __attribute__((target("neon"))) uint32x4_t vabdl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  68990   uint32x4_t __ret;
  68991   __ret = (uint32x4_t)(vmovl_u16((uint16x4_t)(vabd_u16(__p0, __p1))));
  68992   return __ret;
  68993 }
  68994 #else
        /* Big-endian vabdl_u16: reverses the 4 lanes of both operands, applies
         * the __noswap_ forms of vabd_u16 and vmovl_u16, then reverses the lanes
         * of the uint32x4_t result before returning it. */
  68995 __ai __attribute__((target("neon"))) uint32x4_t vabdl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  68996   uint32x4_t __ret;
  68997   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  68998   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  68999   __ret = (uint32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_u16(__rev0, __rev1))));
  69000   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69001   return __ret;
  69002 }
        /* __noswap_vabdl_u16: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  69003 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabdl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  69004   uint32x4_t __ret;
  69005   __ret = (uint32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_u16(__p0, __p1))));
  69006   return __ret;
  69007 }
  69008 #endif
  69009 
  69010 #ifdef __LITTLE_ENDIAN__
        /* vabdl_s8: casts vabd_s8(__p0, __p1) to uint8x8_t, passes it through
         * the unsigned vmovl_u8, and returns the result cast to int16x8_t.
         * NOTE(review): the unsigned vmovl is presumably chosen so the
         * difference is zero-extended rather than sign-extended -- confirm. */
  69011 __ai __attribute__((target("neon"))) int16x8_t vabdl_s8(int8x8_t __p0, int8x8_t __p1) {
  69012   int16x8_t __ret;
  69013   __ret = (int16x8_t)(vmovl_u8((uint8x8_t)(vabd_s8(__p0, __p1))));
  69014   return __ret;
  69015 }
  69016 #else
        /* Big-endian vabdl_s8: reverses the 8 lanes of both operands, applies
         * __noswap_vabd_s8 and __noswap_vmovl_u8 with the same casts, then
         * reverses the lanes of the int16x8_t result before returning it. */
  69017 __ai __attribute__((target("neon"))) int16x8_t vabdl_s8(int8x8_t __p0, int8x8_t __p1) {
  69018   int16x8_t __ret;
  69019   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69020   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69021   __ret = (int16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_s8(__rev0, __rev1))));
  69022   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69023   return __ret;
  69024 }
        /* __noswap_vabdl_s8: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  69025 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabdl_s8(int8x8_t __p0, int8x8_t __p1) {
  69026   int16x8_t __ret;
  69027   __ret = (int16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_s8(__p0, __p1))));
  69028   return __ret;
  69029 }
  69030 #endif
  69031 
  69032 #ifdef __LITTLE_ENDIAN__
        /* vabdl_s32: casts vabd_s32(__p0, __p1) to uint32x2_t, passes it through
         * the unsigned vmovl_u32, and returns the result cast to int64x2_t.
         * NOTE(review): the unsigned vmovl is presumably chosen so the
         * difference is zero-extended rather than sign-extended -- confirm. */
  69033 __ai __attribute__((target("neon"))) int64x2_t vabdl_s32(int32x2_t __p0, int32x2_t __p1) {
  69034   int64x2_t __ret;
  69035   __ret = (int64x2_t)(vmovl_u32((uint32x2_t)(vabd_s32(__p0, __p1))));
  69036   return __ret;
  69037 }
  69038 #else
        /* Big-endian vabdl_s32: swaps the 2 lanes of both operands, applies
         * __noswap_vabd_s32 and __noswap_vmovl_u32 with the same casts, then
         * swaps the lanes of the int64x2_t result back before returning it. */
  69039 __ai __attribute__((target("neon"))) int64x2_t vabdl_s32(int32x2_t __p0, int32x2_t __p1) {
  69040   int64x2_t __ret;
  69041   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69042   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69043   __ret = (int64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_s32(__rev0, __rev1))));
  69044   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69045   return __ret;
  69046 }
        /* __noswap_vabdl_s32: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  69047 __ai __attribute__((target("neon"))) int64x2_t __noswap_vabdl_s32(int32x2_t __p0, int32x2_t __p1) {
  69048   int64x2_t __ret;
  69049   __ret = (int64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_s32(__p0, __p1))));
  69050   return __ret;
  69051 }
  69052 #endif
  69053 
  69054 #ifdef __LITTLE_ENDIAN__
        /* vabdl_s16: casts vabd_s16(__p0, __p1) to uint16x4_t, passes it through
         * the unsigned vmovl_u16, and returns the result cast to int32x4_t.
         * NOTE(review): the unsigned vmovl is presumably chosen so the
         * difference is zero-extended rather than sign-extended -- confirm. */
  69055 __ai __attribute__((target("neon"))) int32x4_t vabdl_s16(int16x4_t __p0, int16x4_t __p1) {
  69056   int32x4_t __ret;
  69057   __ret = (int32x4_t)(vmovl_u16((uint16x4_t)(vabd_s16(__p0, __p1))));
  69058   return __ret;
  69059 }
  69060 #else
        /* Big-endian vabdl_s16: reverses the 4 lanes of both operands, applies
         * __noswap_vabd_s16 and __noswap_vmovl_u16 with the same casts, then
         * reverses the lanes of the int32x4_t result before returning it. */
  69061 __ai __attribute__((target("neon"))) int32x4_t vabdl_s16(int16x4_t __p0, int16x4_t __p1) {
  69062   int32x4_t __ret;
  69063   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69064   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69065   __ret = (int32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_s16(__rev0, __rev1))));
  69066   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69067   return __ret;
  69068 }
        /* __noswap_vabdl_s16: same computation with no lane reversal of the
         * operands or the result; presumably for callers that already hold
         * lane-reversed values, as the big-endian wrappers here do. */
  69069 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabdl_s16(int16x4_t __p0, int16x4_t __p1) {
  69070   int32x4_t __ret;
  69071   __ret = (int32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_s16(__p0, __p1))));
  69072   return __ret;
  69073 }
  69074 #endif
  69075 
  69076 #ifdef __LITTLE_ENDIAN__
        /* vaddl_u8: returns vmovl_u8(__p0) + vmovl_u8(__p1) as a uint16x8_t. */
  69077 __ai __attribute__((target("neon"))) uint16x8_t vaddl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  69078   uint16x8_t __ret;
  69079   __ret = vmovl_u8(__p0) + vmovl_u8(__p1);
  69080   return __ret;
  69081 }
  69082 #else
        /* Big-endian vaddl_u8: reverses the 8 lanes of both operands, adds their
         * __noswap_vmovl_u8 results, then reverses the lanes of the sum before
         * returning it. */
  69083 __ai __attribute__((target("neon"))) uint16x8_t vaddl_u8(uint8x8_t __p0, uint8x8_t __p1) {
  69084   uint16x8_t __ret;
  69085   uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69086   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69087   __ret = __noswap_vmovl_u8(__rev0) + __noswap_vmovl_u8(__rev1);
  69088   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69089   return __ret;
  69090 }
  69091 #endif
  69092 
  69093 #ifdef __LITTLE_ENDIAN__
        /* vaddl_u32: returns vmovl_u32(__p0) + vmovl_u32(__p1) as a uint64x2_t. */
  69094 __ai __attribute__((target("neon"))) uint64x2_t vaddl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  69095   uint64x2_t __ret;
  69096   __ret = vmovl_u32(__p0) + vmovl_u32(__p1);
  69097   return __ret;
  69098 }
  69099 #else
        /* Big-endian vaddl_u32: swaps the 2 lanes of both operands, adds their
         * __noswap_vmovl_u32 results, then swaps the lanes of the sum back
         * before returning it. */
  69100 __ai __attribute__((target("neon"))) uint64x2_t vaddl_u32(uint32x2_t __p0, uint32x2_t __p1) {
  69101   uint64x2_t __ret;
  69102   uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69103   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69104   __ret = __noswap_vmovl_u32(__rev0) + __noswap_vmovl_u32(__rev1);
  69105   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69106   return __ret;
  69107 }
  69108 #endif
  69109 
  69110 #ifdef __LITTLE_ENDIAN__
        /* vaddl_u16: returns vmovl_u16(__p0) + vmovl_u16(__p1) as a uint32x4_t. */
  69111 __ai __attribute__((target("neon"))) uint32x4_t vaddl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  69112   uint32x4_t __ret;
  69113   __ret = vmovl_u16(__p0) + vmovl_u16(__p1);
  69114   return __ret;
  69115 }
  69116 #else
        /* Big-endian vaddl_u16: reverses the 4 lanes of both operands, adds
         * their __noswap_vmovl_u16 results, then reverses the lanes of the sum
         * before returning it. */
  69117 __ai __attribute__((target("neon"))) uint32x4_t vaddl_u16(uint16x4_t __p0, uint16x4_t __p1) {
  69118   uint32x4_t __ret;
  69119   uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69120   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69121   __ret = __noswap_vmovl_u16(__rev0) + __noswap_vmovl_u16(__rev1);
  69122   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69123   return __ret;
  69124 }
  69125 #endif
  69126 
  69127 #ifdef __LITTLE_ENDIAN__
        /* vaddl_s8: returns vmovl_s8(__p0) + vmovl_s8(__p1) as an int16x8_t. */
  69128 __ai __attribute__((target("neon"))) int16x8_t vaddl_s8(int8x8_t __p0, int8x8_t __p1) {
  69129   int16x8_t __ret;
  69130   __ret = vmovl_s8(__p0) + vmovl_s8(__p1);
  69131   return __ret;
  69132 }
  69133 #else
        /* Big-endian vaddl_s8: reverses the 8 lanes of both operands, adds their
         * __noswap_vmovl_s8 results, then reverses the lanes of the sum before
         * returning it. */
  69134 __ai __attribute__((target("neon"))) int16x8_t vaddl_s8(int8x8_t __p0, int8x8_t __p1) {
  69135   int16x8_t __ret;
  69136   int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69137   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69138   __ret = __noswap_vmovl_s8(__rev0) + __noswap_vmovl_s8(__rev1);
  69139   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69140   return __ret;
  69141 }
  69142 #endif
  69143 
  69144 #ifdef __LITTLE_ENDIAN__
        /* vaddl_s32: returns vmovl_s32(__p0) + vmovl_s32(__p1) as an int64x2_t. */
  69145 __ai __attribute__((target("neon"))) int64x2_t vaddl_s32(int32x2_t __p0, int32x2_t __p1) {
  69146   int64x2_t __ret;
  69147   __ret = vmovl_s32(__p0) + vmovl_s32(__p1);
  69148   return __ret;
  69149 }
  69150 #else
        /* Big-endian vaddl_s32: swaps the 2 lanes of both operands, adds their
         * __noswap_vmovl_s32 results, then swaps the lanes of the sum back
         * before returning it. */
  69151 __ai __attribute__((target("neon"))) int64x2_t vaddl_s32(int32x2_t __p0, int32x2_t __p1) {
  69152   int64x2_t __ret;
  69153   int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69154   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69155   __ret = __noswap_vmovl_s32(__rev0) + __noswap_vmovl_s32(__rev1);
  69156   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69157   return __ret;
  69158 }
  69159 #endif
  69160 
  69161 #ifdef __LITTLE_ENDIAN__
        /* vaddl_s16: returns vmovl_s16(__p0) + vmovl_s16(__p1) as an int32x4_t. */
  69162 __ai __attribute__((target("neon"))) int32x4_t vaddl_s16(int16x4_t __p0, int16x4_t __p1) {
  69163   int32x4_t __ret;
  69164   __ret = vmovl_s16(__p0) + vmovl_s16(__p1);
  69165   return __ret;
  69166 }
  69167 #else
        /* Big-endian vaddl_s16: reverses the 4 lanes of both operands, adds
         * their __noswap_vmovl_s16 results, then reverses the lanes of the sum
         * before returning it. */
  69168 __ai __attribute__((target("neon"))) int32x4_t vaddl_s16(int16x4_t __p0, int16x4_t __p1) {
  69169   int32x4_t __ret;
  69170   int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69171   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69172   __ret = __noswap_vmovl_s16(__rev0) + __noswap_vmovl_s16(__rev1);
  69173   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69174   return __ret;
  69175 }
  69176 #endif
  69177 
  69178 #ifdef __LITTLE_ENDIAN__
        /* vaddw_u8: returns __p0 + vmovl_u8(__p1); __p0 is already a uint16x8_t
         * and only the uint8x8_t operand goes through vmovl_u8. */
  69179 __ai __attribute__((target("neon"))) uint16x8_t vaddw_u8(uint16x8_t __p0, uint8x8_t __p1) {
  69180   uint16x8_t __ret;
  69181   __ret = __p0 + vmovl_u8(__p1);
  69182   return __ret;
  69183 }
  69184 #else
        /* Big-endian vaddw_u8: reverses the 8 lanes of both operands, computes
         * __rev0 + __noswap_vmovl_u8(__rev1), then reverses the lanes of the sum
         * before returning it. */
  69185 __ai __attribute__((target("neon"))) uint16x8_t vaddw_u8(uint16x8_t __p0, uint8x8_t __p1) {
  69186   uint16x8_t __ret;
  69187   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69188   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69189   __ret = __rev0 + __noswap_vmovl_u8(__rev1);
  69190   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69191   return __ret;
  69192 }
  69193 #endif
  69194 
  69195 #ifdef __LITTLE_ENDIAN__
  69196 __ai __attribute__((target("neon"))) uint64x2_t vaddw_u32(uint64x2_t __p0, uint32x2_t __p1) {
  69197   uint64x2_t __ret;
  69198   __ret = __p0 + vmovl_u32(__p1);
  69199   return __ret;
  69200 }
  69201 #else
  69202 __ai __attribute__((target("neon"))) uint64x2_t vaddw_u32(uint64x2_t __p0, uint32x2_t __p1) {
  69203   uint64x2_t __ret;
  69204   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69205   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69206   __ret = __rev0 + __noswap_vmovl_u32(__rev1);
  69207   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69208   return __ret;
  69209 }
  69210 #endif
  69211 
  69212 #ifdef __LITTLE_ENDIAN__
  69213 __ai __attribute__((target("neon"))) uint32x4_t vaddw_u16(uint32x4_t __p0, uint16x4_t __p1) {
  69214   uint32x4_t __ret;
  69215   __ret = __p0 + vmovl_u16(__p1);
  69216   return __ret;
  69217 }
  69218 #else
  69219 __ai __attribute__((target("neon"))) uint32x4_t vaddw_u16(uint32x4_t __p0, uint16x4_t __p1) {
  69220   uint32x4_t __ret;
  69221   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69222   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69223   __ret = __rev0 + __noswap_vmovl_u16(__rev1);
  69224   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69225   return __ret;
  69226 }
  69227 #endif
  69228 
  69229 #ifdef __LITTLE_ENDIAN__
  69230 __ai __attribute__((target("neon"))) int16x8_t vaddw_s8(int16x8_t __p0, int8x8_t __p1) {
  69231   int16x8_t __ret;
  69232   __ret = __p0 + vmovl_s8(__p1);
  69233   return __ret;
  69234 }
  69235 #else
  69236 __ai __attribute__((target("neon"))) int16x8_t vaddw_s8(int16x8_t __p0, int8x8_t __p1) {
  69237   int16x8_t __ret;
  69238   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69239   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69240   __ret = __rev0 + __noswap_vmovl_s8(__rev1);
  69241   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69242   return __ret;
  69243 }
  69244 #endif
  69245 
  69246 #ifdef __LITTLE_ENDIAN__
  69247 __ai __attribute__((target("neon"))) int64x2_t vaddw_s32(int64x2_t __p0, int32x2_t __p1) {
  69248   int64x2_t __ret;
  69249   __ret = __p0 + vmovl_s32(__p1);
  69250   return __ret;
  69251 }
  69252 #else
  69253 __ai __attribute__((target("neon"))) int64x2_t vaddw_s32(int64x2_t __p0, int32x2_t __p1) {
  69254   int64x2_t __ret;
  69255   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69256   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69257   __ret = __rev0 + __noswap_vmovl_s32(__rev1);
  69258   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69259   return __ret;
  69260 }
  69261 #endif
  69262 
  69263 #ifdef __LITTLE_ENDIAN__
  69264 __ai __attribute__((target("neon"))) int32x4_t vaddw_s16(int32x4_t __p0, int16x4_t __p1) {
  69265   int32x4_t __ret;
  69266   __ret = __p0 + vmovl_s16(__p1);
  69267   return __ret;
  69268 }
  69269 #else
  69270 __ai __attribute__((target("neon"))) int32x4_t vaddw_s16(int32x4_t __p0, int16x4_t __p1) {
  69271   int32x4_t __ret;
  69272   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69273   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69274   __ret = __rev0 + __noswap_vmovl_s16(__rev1);
  69275   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69276   return __ret;
  69277 }
  69278 #endif
  69279 
  69280 #ifdef __LITTLE_ENDIAN__
  69281 #define vget_lane_f16(__p0_831, __p1_831) __extension__ ({ \
  69282   float16_t __ret_831; \
  69283   float16x4_t __s0_831 = __p0_831; \
  69284   __ret_831 = __builtin_bit_cast(float16_t, vget_lane_s16(__builtin_bit_cast(int16x4_t, __s0_831), __p1_831)); \
  69285   __ret_831; \
  69286 })
  69287 #else
  69288 #define vget_lane_f16(__p0_832, __p1_832) __extension__ ({ \
  69289   float16_t __ret_832; \
  69290   float16x4_t __s0_832 = __p0_832; \
  69291   float16x4_t __rev0_832;  __rev0_832 = __builtin_shufflevector(__s0_832, __s0_832, 3, 2, 1, 0); \
  69292   __ret_832 = __builtin_bit_cast(float16_t, __noswap_vget_lane_s16(__builtin_bit_cast(int16x4_t, __rev0_832), __p1_832)); \
  69293   __ret_832; \
  69294 })
  69295 #define __noswap_vget_lane_f16(__p0_833, __p1_833) __extension__ ({ \
  69296   float16_t __ret_833; \
  69297   float16x4_t __s0_833 = __p0_833; \
  69298   __ret_833 = __builtin_bit_cast(float16_t, __noswap_vget_lane_s16(__builtin_bit_cast(int16x4_t, __s0_833), __p1_833)); \
  69299   __ret_833; \
  69300 })
  69301 #endif
  69302 
  69303 #ifdef __LITTLE_ENDIAN__
  69304 #define vgetq_lane_f16(__p0_834, __p1_834) __extension__ ({ \
  69305   float16_t __ret_834; \
  69306   float16x8_t __s0_834 = __p0_834; \
  69307   __ret_834 = __builtin_bit_cast(float16_t, vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __s0_834), __p1_834)); \
  69308   __ret_834; \
  69309 })
  69310 #else
  69311 #define vgetq_lane_f16(__p0_835, __p1_835) __extension__ ({ \
  69312   float16_t __ret_835; \
  69313   float16x8_t __s0_835 = __p0_835; \
  69314   float16x8_t __rev0_835;  __rev0_835 = __builtin_shufflevector(__s0_835, __s0_835, 7, 6, 5, 4, 3, 2, 1, 0); \
  69315   __ret_835 = __builtin_bit_cast(float16_t, __noswap_vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __rev0_835), __p1_835)); \
  69316   __ret_835; \
  69317 })
  69318 #define __noswap_vgetq_lane_f16(__p0_836, __p1_836) __extension__ ({ \
  69319   float16_t __ret_836; \
  69320   float16x8_t __s0_836 = __p0_836; \
  69321   __ret_836 = __builtin_bit_cast(float16_t, __noswap_vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __s0_836), __p1_836)); \
  69322   __ret_836; \
  69323 })
  69324 #endif
  69325 
  69326 #ifdef __LITTLE_ENDIAN__
  69327 __ai __attribute__((target("neon"))) uint16x8_t vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69328   uint16x8_t __ret;
  69329   __ret = __p0 + vmull_u8(__p1, __p2);
  69330   return __ret;
  69331 }
  69332 #else
  69333 __ai __attribute__((target("neon"))) uint16x8_t vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69334   uint16x8_t __ret;
  69335   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69336   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69337   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  69338   __ret = __rev0 + __noswap_vmull_u8(__rev1, __rev2);
  69339   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69340   return __ret;
  69341 }
  69342 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69343   uint16x8_t __ret;
  69344   __ret = __p0 + __noswap_vmull_u8(__p1, __p2);
  69345   return __ret;
  69346 }
  69347 #endif
  69348 
  69349 #ifdef __LITTLE_ENDIAN__
  69350 __ai __attribute__((target("neon"))) uint64x2_t vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69351   uint64x2_t __ret;
  69352   __ret = __p0 + vmull_u32(__p1, __p2);
  69353   return __ret;
  69354 }
  69355 #else
  69356 __ai __attribute__((target("neon"))) uint64x2_t vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69357   uint64x2_t __ret;
  69358   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69359   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69360   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  69361   __ret = __rev0 + __noswap_vmull_u32(__rev1, __rev2);
  69362   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69363   return __ret;
  69364 }
  69365 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69366   uint64x2_t __ret;
  69367   __ret = __p0 + __noswap_vmull_u32(__p1, __p2);
  69368   return __ret;
  69369 }
  69370 #endif
  69371 
  69372 #ifdef __LITTLE_ENDIAN__
  69373 __ai __attribute__((target("neon"))) uint32x4_t vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69374   uint32x4_t __ret;
  69375   __ret = __p0 + vmull_u16(__p1, __p2);
  69376   return __ret;
  69377 }
  69378 #else
  69379 __ai __attribute__((target("neon"))) uint32x4_t vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69380   uint32x4_t __ret;
  69381   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69382   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69383   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  69384   __ret = __rev0 + __noswap_vmull_u16(__rev1, __rev2);
  69385   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69386   return __ret;
  69387 }
  69388 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69389   uint32x4_t __ret;
  69390   __ret = __p0 + __noswap_vmull_u16(__p1, __p2);
  69391   return __ret;
  69392 }
  69393 #endif
  69394 
  69395 #ifdef __LITTLE_ENDIAN__
  69396 __ai __attribute__((target("neon"))) int16x8_t vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69397   int16x8_t __ret;
  69398   __ret = __p0 + vmull_s8(__p1, __p2);
  69399   return __ret;
  69400 }
  69401 #else
  69402 __ai __attribute__((target("neon"))) int16x8_t vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69403   int16x8_t __ret;
  69404   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69405   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69406   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  69407   __ret = __rev0 + __noswap_vmull_s8(__rev1, __rev2);
  69408   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69409   return __ret;
  69410 }
  69411 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69412   int16x8_t __ret;
  69413   __ret = __p0 + __noswap_vmull_s8(__p1, __p2);
  69414   return __ret;
  69415 }
  69416 #endif
  69417 
  69418 #ifdef __LITTLE_ENDIAN__
  69419 __ai __attribute__((target("neon"))) int64x2_t vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69420   int64x2_t __ret;
  69421   __ret = __p0 + vmull_s32(__p1, __p2);
  69422   return __ret;
  69423 }
  69424 #else
  69425 __ai __attribute__((target("neon"))) int64x2_t vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69426   int64x2_t __ret;
  69427   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69428   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69429   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  69430   __ret = __rev0 + __noswap_vmull_s32(__rev1, __rev2);
  69431   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69432   return __ret;
  69433 }
  69434 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69435   int64x2_t __ret;
  69436   __ret = __p0 + __noswap_vmull_s32(__p1, __p2);
  69437   return __ret;
  69438 }
  69439 #endif
  69440 
  69441 #ifdef __LITTLE_ENDIAN__
  69442 __ai __attribute__((target("neon"))) int32x4_t vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69443   int32x4_t __ret;
  69444   __ret = __p0 + vmull_s16(__p1, __p2);
  69445   return __ret;
  69446 }
  69447 #else
  69448 __ai __attribute__((target("neon"))) int32x4_t vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69449   int32x4_t __ret;
  69450   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69451   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69452   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  69453   __ret = __rev0 + __noswap_vmull_s16(__rev1, __rev2);
  69454   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69455   return __ret;
  69456 }
  69457 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69458   int32x4_t __ret;
  69459   __ret = __p0 + __noswap_vmull_s16(__p1, __p2);
  69460   return __ret;
  69461 }
  69462 #endif
  69463 
  69464 #ifdef __LITTLE_ENDIAN__
  69465 #define vmlal_lane_u32(__p0_837, __p1_837, __p2_837, __p3_837) __extension__ ({ \
  69466   uint64x2_t __ret_837; \
  69467   uint64x2_t __s0_837 = __p0_837; \
  69468   uint32x2_t __s1_837 = __p1_837; \
  69469   uint32x2_t __s2_837 = __p2_837; \
  69470   __ret_837 = __s0_837 + vmull_u32(__s1_837, splat_lane_u32(__s2_837, __p3_837)); \
  69471   __ret_837; \
  69472 })
  69473 #else
  69474 #define vmlal_lane_u32(__p0_838, __p1_838, __p2_838, __p3_838) __extension__ ({ \
  69475   uint64x2_t __ret_838; \
  69476   uint64x2_t __s0_838 = __p0_838; \
  69477   uint32x2_t __s1_838 = __p1_838; \
  69478   uint32x2_t __s2_838 = __p2_838; \
  69479   uint64x2_t __rev0_838;  __rev0_838 = __builtin_shufflevector(__s0_838, __s0_838, 1, 0); \
  69480   uint32x2_t __rev1_838;  __rev1_838 = __builtin_shufflevector(__s1_838, __s1_838, 1, 0); \
  69481   uint32x2_t __rev2_838;  __rev2_838 = __builtin_shufflevector(__s2_838, __s2_838, 1, 0); \
  69482   __ret_838 = __rev0_838 + __noswap_vmull_u32(__rev1_838, __noswap_splat_lane_u32(__rev2_838, __p3_838)); \
  69483   __ret_838 = __builtin_shufflevector(__ret_838, __ret_838, 1, 0); \
  69484   __ret_838; \
  69485 })
  69486 #endif
  69487 
  69488 #ifdef __LITTLE_ENDIAN__
  69489 #define vmlal_lane_u16(__p0_839, __p1_839, __p2_839, __p3_839) __extension__ ({ \
  69490   uint32x4_t __ret_839; \
  69491   uint32x4_t __s0_839 = __p0_839; \
  69492   uint16x4_t __s1_839 = __p1_839; \
  69493   uint16x4_t __s2_839 = __p2_839; \
  69494   __ret_839 = __s0_839 + vmull_u16(__s1_839, splat_lane_u16(__s2_839, __p3_839)); \
  69495   __ret_839; \
  69496 })
  69497 #else
  69498 #define vmlal_lane_u16(__p0_840, __p1_840, __p2_840, __p3_840) __extension__ ({ \
  69499   uint32x4_t __ret_840; \
  69500   uint32x4_t __s0_840 = __p0_840; \
  69501   uint16x4_t __s1_840 = __p1_840; \
  69502   uint16x4_t __s2_840 = __p2_840; \
  69503   uint32x4_t __rev0_840;  __rev0_840 = __builtin_shufflevector(__s0_840, __s0_840, 3, 2, 1, 0); \
  69504   uint16x4_t __rev1_840;  __rev1_840 = __builtin_shufflevector(__s1_840, __s1_840, 3, 2, 1, 0); \
  69505   uint16x4_t __rev2_840;  __rev2_840 = __builtin_shufflevector(__s2_840, __s2_840, 3, 2, 1, 0); \
  69506   __ret_840 = __rev0_840 + __noswap_vmull_u16(__rev1_840, __noswap_splat_lane_u16(__rev2_840, __p3_840)); \
  69507   __ret_840 = __builtin_shufflevector(__ret_840, __ret_840, 3, 2, 1, 0); \
  69508   __ret_840; \
  69509 })
  69510 #endif
  69511 
  69512 #ifdef __LITTLE_ENDIAN__
  69513 #define vmlal_lane_s32(__p0_841, __p1_841, __p2_841, __p3_841) __extension__ ({ \
  69514   int64x2_t __ret_841; \
  69515   int64x2_t __s0_841 = __p0_841; \
  69516   int32x2_t __s1_841 = __p1_841; \
  69517   int32x2_t __s2_841 = __p2_841; \
  69518   __ret_841 = __s0_841 + vmull_s32(__s1_841, splat_lane_s32(__s2_841, __p3_841)); \
  69519   __ret_841; \
  69520 })
  69521 #else
  69522 #define vmlal_lane_s32(__p0_842, __p1_842, __p2_842, __p3_842) __extension__ ({ \
  69523   int64x2_t __ret_842; \
  69524   int64x2_t __s0_842 = __p0_842; \
  69525   int32x2_t __s1_842 = __p1_842; \
  69526   int32x2_t __s2_842 = __p2_842; \
  69527   int64x2_t __rev0_842;  __rev0_842 = __builtin_shufflevector(__s0_842, __s0_842, 1, 0); \
  69528   int32x2_t __rev1_842;  __rev1_842 = __builtin_shufflevector(__s1_842, __s1_842, 1, 0); \
  69529   int32x2_t __rev2_842;  __rev2_842 = __builtin_shufflevector(__s2_842, __s2_842, 1, 0); \
  69530   __ret_842 = __rev0_842 + __noswap_vmull_s32(__rev1_842, __noswap_splat_lane_s32(__rev2_842, __p3_842)); \
  69531   __ret_842 = __builtin_shufflevector(__ret_842, __ret_842, 1, 0); \
  69532   __ret_842; \
  69533 })
  69534 #endif
  69535 
  69536 #ifdef __LITTLE_ENDIAN__
  69537 #define vmlal_lane_s16(__p0_843, __p1_843, __p2_843, __p3_843) __extension__ ({ \
  69538   int32x4_t __ret_843; \
  69539   int32x4_t __s0_843 = __p0_843; \
  69540   int16x4_t __s1_843 = __p1_843; \
  69541   int16x4_t __s2_843 = __p2_843; \
  69542   __ret_843 = __s0_843 + vmull_s16(__s1_843, splat_lane_s16(__s2_843, __p3_843)); \
  69543   __ret_843; \
  69544 })
  69545 #else
  69546 #define vmlal_lane_s16(__p0_844, __p1_844, __p2_844, __p3_844) __extension__ ({ \
  69547   int32x4_t __ret_844; \
  69548   int32x4_t __s0_844 = __p0_844; \
  69549   int16x4_t __s1_844 = __p1_844; \
  69550   int16x4_t __s2_844 = __p2_844; \
  69551   int32x4_t __rev0_844;  __rev0_844 = __builtin_shufflevector(__s0_844, __s0_844, 3, 2, 1, 0); \
  69552   int16x4_t __rev1_844;  __rev1_844 = __builtin_shufflevector(__s1_844, __s1_844, 3, 2, 1, 0); \
  69553   int16x4_t __rev2_844;  __rev2_844 = __builtin_shufflevector(__s2_844, __s2_844, 3, 2, 1, 0); \
  69554   __ret_844 = __rev0_844 + __noswap_vmull_s16(__rev1_844, __noswap_splat_lane_s16(__rev2_844, __p3_844)); \
  69555   __ret_844 = __builtin_shufflevector(__ret_844, __ret_844, 3, 2, 1, 0); \
  69556   __ret_844; \
  69557 })
  69558 #endif
  69559 
  69560 #ifdef __LITTLE_ENDIAN__
  69561 __ai __attribute__((target("neon"))) uint64x2_t vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69562   uint64x2_t __ret;
  69563   __ret = __p0 + vmull_u32(__p1, (uint32x2_t) {__p2, __p2});
  69564   return __ret;
  69565 }
  69566 #else
  69567 __ai __attribute__((target("neon"))) uint64x2_t vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69568   uint64x2_t __ret;
  69569   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69570   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69571   __ret = __rev0 + __noswap_vmull_u32(__rev1, (uint32x2_t) {__p2, __p2});
  69572   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69573   return __ret;
  69574 }
  69575 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69576   uint64x2_t __ret;
  69577   __ret = __p0 + __noswap_vmull_u32(__p1, (uint32x2_t) {__p2, __p2});
  69578   return __ret;
  69579 }
  69580 #endif
  69581 
  69582 #ifdef __LITTLE_ENDIAN__
  69583 __ai __attribute__((target("neon"))) uint32x4_t vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69584   uint32x4_t __ret;
  69585   __ret = __p0 + vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69586   return __ret;
  69587 }
  69588 #else
  69589 __ai __attribute__((target("neon"))) uint32x4_t vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69590   uint32x4_t __ret;
  69591   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69592   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69593   __ret = __rev0 + __noswap_vmull_u16(__rev1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69594   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69595   return __ret;
  69596 }
  69597 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69598   uint32x4_t __ret;
  69599   __ret = __p0 + __noswap_vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69600   return __ret;
  69601 }
  69602 #endif
  69603 
  69604 #ifdef __LITTLE_ENDIAN__
  69605 __ai __attribute__((target("neon"))) int64x2_t vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69606   int64x2_t __ret;
  69607   __ret = __p0 + vmull_s32(__p1, (int32x2_t) {__p2, __p2});
  69608   return __ret;
  69609 }
  69610 #else
  69611 __ai __attribute__((target("neon"))) int64x2_t vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69612   int64x2_t __ret;
  69613   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69614   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69615   __ret = __rev0 + __noswap_vmull_s32(__rev1, (int32x2_t) {__p2, __p2});
  69616   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69617   return __ret;
  69618 }
  69619 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69620   int64x2_t __ret;
  69621   __ret = __p0 + __noswap_vmull_s32(__p1, (int32x2_t) {__p2, __p2});
  69622   return __ret;
  69623 }
  69624 #endif
  69625 
  69626 #ifdef __LITTLE_ENDIAN__
  69627 __ai __attribute__((target("neon"))) int32x4_t vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69628   int32x4_t __ret;
  69629   __ret = __p0 + vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69630   return __ret;
  69631 }
  69632 #else
  69633 __ai __attribute__((target("neon"))) int32x4_t vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69634   int32x4_t __ret;
  69635   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69636   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69637   __ret = __rev0 + __noswap_vmull_s16(__rev1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69638   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69639   return __ret;
  69640 }
  69641 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69642   int32x4_t __ret;
  69643   __ret = __p0 + __noswap_vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69644   return __ret;
  69645 }
  69646 #endif
  69647 
  69648 #ifdef __LITTLE_ENDIAN__
  69649 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69650   uint16x8_t __ret;
  69651   __ret = __p0 - vmull_u8(__p1, __p2);
  69652   return __ret;
  69653 }
  69654 #else
  69655 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69656   uint16x8_t __ret;
  69657   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69658   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69659   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  69660   __ret = __rev0 - __noswap_vmull_u8(__rev1, __rev2);
  69661   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69662   return __ret;
  69663 }
  69664 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  69665   uint16x8_t __ret;
  69666   __ret = __p0 - __noswap_vmull_u8(__p1, __p2);
  69667   return __ret;
  69668 }
  69669 #endif
  69670 
  69671 #ifdef __LITTLE_ENDIAN__
  69672 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69673   uint64x2_t __ret;
  69674   __ret = __p0 - vmull_u32(__p1, __p2);
  69675   return __ret;
  69676 }
  69677 #else
  69678 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69679   uint64x2_t __ret;
  69680   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69681   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69682   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  69683   __ret = __rev0 - __noswap_vmull_u32(__rev1, __rev2);
  69684   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69685   return __ret;
  69686 }
  69687 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  69688   uint64x2_t __ret;
  69689   __ret = __p0 - __noswap_vmull_u32(__p1, __p2);
  69690   return __ret;
  69691 }
  69692 #endif
  69693 
  69694 #ifdef __LITTLE_ENDIAN__
  69695 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69696   uint32x4_t __ret;
  69697   __ret = __p0 - vmull_u16(__p1, __p2);
  69698   return __ret;
  69699 }
  69700 #else
  69701 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69702   uint32x4_t __ret;
  69703   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69704   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69705   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  69706   __ret = __rev0 - __noswap_vmull_u16(__rev1, __rev2);
  69707   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69708   return __ret;
  69709 }
  69710 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  69711   uint32x4_t __ret;
  69712   __ret = __p0 - __noswap_vmull_u16(__p1, __p2);
  69713   return __ret;
  69714 }
  69715 #endif
  69716 
  69717 #ifdef __LITTLE_ENDIAN__
  69718 __ai __attribute__((target("neon"))) int16x8_t vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69719   int16x8_t __ret;
  69720   __ret = __p0 - vmull_s8(__p1, __p2);
  69721   return __ret;
  69722 }
  69723 #else
  69724 __ai __attribute__((target("neon"))) int16x8_t vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69725   int16x8_t __ret;
  69726   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  69727   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  69728   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  69729   __ret = __rev0 - __noswap_vmull_s8(__rev1, __rev2);
  69730   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  69731   return __ret;
  69732 }
  69733 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  69734   int16x8_t __ret;
  69735   __ret = __p0 - __noswap_vmull_s8(__p1, __p2);
  69736   return __ret;
  69737 }
  69738 #endif
  69739 
  69740 #ifdef __LITTLE_ENDIAN__
  69741 __ai __attribute__((target("neon"))) int64x2_t vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69742   int64x2_t __ret;
  69743   __ret = __p0 - vmull_s32(__p1, __p2);
  69744   return __ret;
  69745 }
  69746 #else
  69747 __ai __attribute__((target("neon"))) int64x2_t vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69748   int64x2_t __ret;
  69749   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69750   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69751   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  69752   __ret = __rev0 - __noswap_vmull_s32(__rev1, __rev2);
  69753   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69754   return __ret;
  69755 }
  69756 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  69757   int64x2_t __ret;
  69758   __ret = __p0 - __noswap_vmull_s32(__p1, __p2);
  69759   return __ret;
  69760 }
  69761 #endif
  69762 
  69763 #ifdef __LITTLE_ENDIAN__
  69764 __ai __attribute__((target("neon"))) int32x4_t vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69765   int32x4_t __ret;
  69766   __ret = __p0 - vmull_s16(__p1, __p2);
  69767   return __ret;
  69768 }
  69769 #else
  69770 __ai __attribute__((target("neon"))) int32x4_t vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69771   int32x4_t __ret;
  69772   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69773   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69774   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  69775   __ret = __rev0 - __noswap_vmull_s16(__rev1, __rev2);
  69776   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69777   return __ret;
  69778 }
  69779 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  69780   int32x4_t __ret;
  69781   __ret = __p0 - __noswap_vmull_s16(__p1, __p2);
  69782   return __ret;
  69783 }
  69784 #endif
  69785 
  69786 #ifdef __LITTLE_ENDIAN__
  69787 #define vmlsl_lane_u32(__p0_845, __p1_845, __p2_845, __p3_845) __extension__ ({ \
  69788   uint64x2_t __ret_845; \
  69789   uint64x2_t __s0_845 = __p0_845; \
  69790   uint32x2_t __s1_845 = __p1_845; \
  69791   uint32x2_t __s2_845 = __p2_845; \
  69792   __ret_845 = __s0_845 - vmull_u32(__s1_845, splat_lane_u32(__s2_845, __p3_845)); \
  69793   __ret_845; \
  69794 })
  69795 #else
  69796 #define vmlsl_lane_u32(__p0_846, __p1_846, __p2_846, __p3_846) __extension__ ({ \
  69797   uint64x2_t __ret_846; \
  69798   uint64x2_t __s0_846 = __p0_846; \
  69799   uint32x2_t __s1_846 = __p1_846; \
  69800   uint32x2_t __s2_846 = __p2_846; \
  69801   uint64x2_t __rev0_846;  __rev0_846 = __builtin_shufflevector(__s0_846, __s0_846, 1, 0); \
  69802   uint32x2_t __rev1_846;  __rev1_846 = __builtin_shufflevector(__s1_846, __s1_846, 1, 0); \
  69803   uint32x2_t __rev2_846;  __rev2_846 = __builtin_shufflevector(__s2_846, __s2_846, 1, 0); \
  69804   __ret_846 = __rev0_846 - __noswap_vmull_u32(__rev1_846, __noswap_splat_lane_u32(__rev2_846, __p3_846)); \
  69805   __ret_846 = __builtin_shufflevector(__ret_846, __ret_846, 1, 0); \
  69806   __ret_846; \
  69807 })
  69808 #endif
  69809 
  69810 #ifdef __LITTLE_ENDIAN__
  69811 #define vmlsl_lane_u16(__p0_847, __p1_847, __p2_847, __p3_847) __extension__ ({ \
  69812   uint32x4_t __ret_847; \
  69813   uint32x4_t __s0_847 = __p0_847; \
  69814   uint16x4_t __s1_847 = __p1_847; \
  69815   uint16x4_t __s2_847 = __p2_847; \
  69816   __ret_847 = __s0_847 - vmull_u16(__s1_847, splat_lane_u16(__s2_847, __p3_847)); \
  69817   __ret_847; \
  69818 })
  69819 #else
  69820 #define vmlsl_lane_u16(__p0_848, __p1_848, __p2_848, __p3_848) __extension__ ({ \
  69821   uint32x4_t __ret_848; \
  69822   uint32x4_t __s0_848 = __p0_848; \
  69823   uint16x4_t __s1_848 = __p1_848; \
  69824   uint16x4_t __s2_848 = __p2_848; \
  69825   uint32x4_t __rev0_848;  __rev0_848 = __builtin_shufflevector(__s0_848, __s0_848, 3, 2, 1, 0); \
  69826   uint16x4_t __rev1_848;  __rev1_848 = __builtin_shufflevector(__s1_848, __s1_848, 3, 2, 1, 0); \
  69827   uint16x4_t __rev2_848;  __rev2_848 = __builtin_shufflevector(__s2_848, __s2_848, 3, 2, 1, 0); \
  69828   __ret_848 = __rev0_848 - __noswap_vmull_u16(__rev1_848, __noswap_splat_lane_u16(__rev2_848, __p3_848)); \
  69829   __ret_848 = __builtin_shufflevector(__ret_848, __ret_848, 3, 2, 1, 0); \
  69830   __ret_848; \
  69831 })
  69832 #endif
  69833 
  69834 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_lane_s32(acc, a, v, lane): evaluates to
         *   acc - vmull_s32(a, splat_lane_s32(v, lane))
         * acc is int64x2_t, a and v are int32x2_t; the result is int64x2_t.
         * Implemented as a statement-expression macro: acc, a and v are each
         * copied into a local once, and lane is forwarded to splat_lane_s32.
         * Little-endian variant: operands are used as-is. */
  69835 #define vmlsl_lane_s32(__p0_849, __p1_849, __p2_849, __p3_849) __extension__ ({ \
  69836   int64x2_t __ret_849; \
  69837   int64x2_t __s0_849 = __p0_849; \
  69838   int32x2_t __s1_849 = __p1_849; \
  69839   int32x2_t __s2_849 = __p2_849; \
  69840   __ret_849 = __s0_849 - vmull_s32(__s1_849, splat_lane_s32(__s2_849, __p3_849)); \
  69841   __ret_849; \
  69842 })
  69843 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  69844 #define vmlsl_lane_s32(__p0_850, __p1_850, __p2_850, __p3_850) __extension__ ({ \
  69845   int64x2_t __ret_850; \
  69846   int64x2_t __s0_850 = __p0_850; \
  69847   int32x2_t __s1_850 = __p1_850; \
  69848   int32x2_t __s2_850 = __p2_850; \
  69849   int64x2_t __rev0_850;  __rev0_850 = __builtin_shufflevector(__s0_850, __s0_850, 1, 0); \
  69850   int32x2_t __rev1_850;  __rev1_850 = __builtin_shufflevector(__s1_850, __s1_850, 1, 0); \
  69851   int32x2_t __rev2_850;  __rev2_850 = __builtin_shufflevector(__s2_850, __s2_850, 1, 0); \
  69852   __ret_850 = __rev0_850 - __noswap_vmull_s32(__rev1_850, __noswap_splat_lane_s32(__rev2_850, __p3_850)); \
  69853   __ret_850 = __builtin_shufflevector(__ret_850, __ret_850, 1, 0); \
  69854   __ret_850; \
  69855 })
  69856 #endif
  69857 
  69858 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_lane_s16(acc, a, v, lane): evaluates to
         *   acc - vmull_s16(a, splat_lane_s16(v, lane))
         * acc is int32x4_t, a and v are int16x4_t; the result is int32x4_t.
         * Implemented as a statement-expression macro: acc, a and v are each
         * copied into a local once, and lane is forwarded to splat_lane_s16.
         * Little-endian variant: operands are used as-is. */
  69859 #define vmlsl_lane_s16(__p0_851, __p1_851, __p2_851, __p3_851) __extension__ ({ \
  69860   int32x4_t __ret_851; \
  69861   int32x4_t __s0_851 = __p0_851; \
  69862   int16x4_t __s1_851 = __p1_851; \
  69863   int16x4_t __s2_851 = __p2_851; \
  69864   __ret_851 = __s0_851 - vmull_s16(__s1_851, splat_lane_s16(__s2_851, __p3_851)); \
  69865   __ret_851; \
  69866 })
  69867 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  69868 #define vmlsl_lane_s16(__p0_852, __p1_852, __p2_852, __p3_852) __extension__ ({ \
  69869   int32x4_t __ret_852; \
  69870   int32x4_t __s0_852 = __p0_852; \
  69871   int16x4_t __s1_852 = __p1_852; \
  69872   int16x4_t __s2_852 = __p2_852; \
  69873   int32x4_t __rev0_852;  __rev0_852 = __builtin_shufflevector(__s0_852, __s0_852, 3, 2, 1, 0); \
  69874   int16x4_t __rev1_852;  __rev1_852 = __builtin_shufflevector(__s1_852, __s1_852, 3, 2, 1, 0); \
  69875   int16x4_t __rev2_852;  __rev2_852 = __builtin_shufflevector(__s2_852, __s2_852, 3, 2, 1, 0); \
  69876   __ret_852 = __rev0_852 - __noswap_vmull_s16(__rev1_852, __noswap_splat_lane_s16(__rev2_852, __p3_852)); \
  69877   __ret_852 = __builtin_shufflevector(__ret_852, __ret_852, 3, 2, 1, 0); \
  69878   __ret_852; \
  69879 })
  69880 #endif
  69881 
  69882 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_n_u32: returns __p0 - vmull_u32(__p1, {__p2, __p2}).
         * The scalar __p2 is placed in both lanes of a uint32x2_t literal before
         * the multiply. Little-endian variant: operands are used as-is. */
  69883 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69884   uint64x2_t __ret;
  69885   __ret = __p0 - vmull_u32(__p1, (uint32x2_t) {__p2, __p2});
  69886   return __ret;
  69887 }
  69888 #else
        /* Big-endian variant: __p0 and __p1 are lane-reversed with
         * __builtin_shufflevector, __noswap_vmull_u32 operates on the reversed
         * vectors, and the result is lane-reversed again before returning. The
         * scalar literal needs no reversal because both of its lanes are equal. */
  69889 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69890   uint64x2_t __ret;
  69891   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69892   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69893   __ret = __rev0 - __noswap_vmull_u32(__rev1, (uint32x2_t) {__p2, __p2});
  69894   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69895   return __ret;
  69896 }
        /* Same computation with no lane reversal of inputs or result.
         * NOTE(review): presumably for callers that have already reversed their
         * operands; no caller is visible in this part of the file. */
  69897 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) {
  69898   uint64x2_t __ret;
  69899   __ret = __p0 - __noswap_vmull_u32(__p1, (uint32x2_t) {__p2, __p2});
  69900   return __ret;
  69901 }
  69902 #endif
  69903 
  69904 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_n_u16: returns __p0 - vmull_u16(__p1, {__p2, __p2, __p2, __p2}).
         * The scalar __p2 is placed in all four lanes of a uint16x4_t literal
         * before the multiply. Little-endian variant: operands are used as-is. */
  69905 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69906   uint32x4_t __ret;
  69907   __ret = __p0 - vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69908   return __ret;
  69909 }
  69910 #else
        /* Big-endian variant: __p0 and __p1 are lane-reversed with
         * __builtin_shufflevector, __noswap_vmull_u16 operates on the reversed
         * vectors, and the result is lane-reversed again before returning. The
         * scalar literal needs no reversal because all of its lanes are equal. */
  69911 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69912   uint32x4_t __ret;
  69913   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69914   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69915   __ret = __rev0 - __noswap_vmull_u16(__rev1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69916   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69917   return __ret;
  69918 }
        /* Same computation with no lane reversal of inputs or result.
         * NOTE(review): presumably for callers that have already reversed their
         * operands; no caller is visible in this part of the file. */
  69919 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) {
  69920   uint32x4_t __ret;
  69921   __ret = __p0 - __noswap_vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2});
  69922   return __ret;
  69923 }
  69924 #endif
  69925 
  69926 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_n_s32: returns __p0 - vmull_s32(__p1, {__p2, __p2}).
         * The scalar __p2 is placed in both lanes of an int32x2_t literal before
         * the multiply. Little-endian variant: operands are used as-is. */
  69927 __ai __attribute__((target("neon"))) int64x2_t vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69928   int64x2_t __ret;
  69929   __ret = __p0 - vmull_s32(__p1, (int32x2_t) {__p2, __p2});
  69930   return __ret;
  69931 }
  69932 #else
        /* Big-endian variant: __p0 and __p1 are lane-reversed with
         * __builtin_shufflevector, __noswap_vmull_s32 operates on the reversed
         * vectors, and the result is lane-reversed again before returning. The
         * scalar literal needs no reversal because both of its lanes are equal. */
  69933 __ai __attribute__((target("neon"))) int64x2_t vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69934   int64x2_t __ret;
  69935   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  69936   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  69937   __ret = __rev0 - __noswap_vmull_s32(__rev1, (int32x2_t) {__p2, __p2});
  69938   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  69939   return __ret;
  69940 }
        /* Same computation with no lane reversal of inputs or result.
         * NOTE(review): presumably for callers that have already reversed their
         * operands; no caller is visible in this part of the file. */
  69941 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) {
  69942   int64x2_t __ret;
  69943   __ret = __p0 - __noswap_vmull_s32(__p1, (int32x2_t) {__p2, __p2});
  69944   return __ret;
  69945 }
  69946 #endif
  69947 
  69948 #ifdef __LITTLE_ENDIAN__
        /* vmlsl_n_s16: returns __p0 - vmull_s16(__p1, {__p2, __p2, __p2, __p2}).
         * The scalar __p2 is placed in all four lanes of an int16x4_t literal
         * before the multiply. Little-endian variant: operands are used as-is. */
  69949 __ai __attribute__((target("neon"))) int32x4_t vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69950   int32x4_t __ret;
  69951   __ret = __p0 - vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69952   return __ret;
  69953 }
  69954 #else
        /* Big-endian variant: __p0 and __p1 are lane-reversed with
         * __builtin_shufflevector, __noswap_vmull_s16 operates on the reversed
         * vectors, and the result is lane-reversed again before returning. The
         * scalar literal needs no reversal because all of its lanes are equal. */
  69955 __ai __attribute__((target("neon"))) int32x4_t vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69956   int32x4_t __ret;
  69957   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  69958   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  69959   __ret = __rev0 - __noswap_vmull_s16(__rev1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69960   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  69961   return __ret;
  69962 }
        /* Same computation with no lane reversal of inputs or result.
         * NOTE(review): presumably for callers that have already reversed their
         * operands; no caller is visible in this part of the file. */
  69963 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) {
  69964   int32x4_t __ret;
  69965   __ret = __p0 - __noswap_vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2});
  69966   return __ret;
  69967 }
  69968 #endif
  69969 
  69970 #ifdef __LITTLE_ENDIAN__
        /* vset_lane_f16(value, vec, lane): delegates to vset_lane_s16.
         * The float16_t value is bit-cast to int16_t and the float16x4_t vector
         * to int16x4_t, vset_lane_s16 is applied with the same lane argument, and
         * its result is bit-cast back to float16x4_t. Little-endian variant:
         * the vector is used as-is. */
  69971 #define vset_lane_f16(__p0_853, __p1_853, __p2_853) __extension__ ({ \
  69972   float16x4_t __ret_853; \
  69973   float16_t __s0_853 = __p0_853; \
  69974   float16x4_t __s1_853 = __p1_853; \
  69975   __ret_853 = __builtin_bit_cast(float16x4_t, vset_lane_s16(__builtin_bit_cast(int16_t, __s0_853), __builtin_bit_cast(int16x4_t, __s1_853), __p2_853)); \
  69976   __ret_853; \
  69977 })
  69978 #else
        /* Big-endian variant: the vector is lane-reversed with
         * __builtin_shufflevector, __noswap_vset_lane_s16 operates on the
         * reversed vector, and the result is lane-reversed again before it is
         * yielded. */
  69979 #define vset_lane_f16(__p0_854, __p1_854, __p2_854) __extension__ ({ \
  69980   float16x4_t __ret_854; \
  69981   float16_t __s0_854 = __p0_854; \
  69982   float16x4_t __s1_854 = __p1_854; \
  69983   float16x4_t __rev1_854;  __rev1_854 = __builtin_shufflevector(__s1_854, __s1_854, 3, 2, 1, 0); \
  69984   __ret_854 = __builtin_bit_cast(float16x4_t, __noswap_vset_lane_s16(__builtin_bit_cast(int16_t, __s0_854), __builtin_bit_cast(int16x4_t, __rev1_854), __p2_854)); \
  69985   __ret_854 = __builtin_shufflevector(__ret_854, __ret_854, 3, 2, 1, 0); \
  69986   __ret_854; \
  69987 })
  69988 #endif
  69989 
  69990 #ifdef __LITTLE_ENDIAN__
        /* vsetq_lane_f16(value, vec, lane): delegates to vsetq_lane_s16.
         * The float16_t value is bit-cast to int16_t and the float16x8_t vector
         * to int16x8_t, vsetq_lane_s16 is applied with the same lane argument,
         * and its result is bit-cast back to float16x8_t. Little-endian variant:
         * the vector is used as-is. */
  69991 #define vsetq_lane_f16(__p0_855, __p1_855, __p2_855) __extension__ ({ \
  69992   float16x8_t __ret_855; \
  69993   float16_t __s0_855 = __p0_855; \
  69994   float16x8_t __s1_855 = __p1_855; \
  69995   __ret_855 = __builtin_bit_cast(float16x8_t, vsetq_lane_s16(__builtin_bit_cast(int16_t, __s0_855), __builtin_bit_cast(int16x8_t, __s1_855), __p2_855)); \
  69996   __ret_855; \
  69997 })
  69998 #else
        /* Big-endian variant: the vector is lane-reversed with
         * __builtin_shufflevector, __noswap_vsetq_lane_s16 operates on the
         * reversed vector, and the result is lane-reversed again before it is
         * yielded. */
  69999 #define vsetq_lane_f16(__p0_856, __p1_856, __p2_856) __extension__ ({ \
  70000   float16x8_t __ret_856; \
  70001   float16_t __s0_856 = __p0_856; \
  70002   float16x8_t __s1_856 = __p1_856; \
  70003   float16x8_t __rev1_856;  __rev1_856 = __builtin_shufflevector(__s1_856, __s1_856, 7, 6, 5, 4, 3, 2, 1, 0); \
  70004   __ret_856 = __builtin_bit_cast(float16x8_t, __noswap_vsetq_lane_s16(__builtin_bit_cast(int16_t, __s0_856), __builtin_bit_cast(int16x8_t, __rev1_856), __p2_856)); \
  70005   __ret_856 = __builtin_shufflevector(__ret_856, __ret_856, 7, 6, 5, 4, 3, 2, 1, 0); \
  70006   __ret_856; \
  70007 })
  70008 #endif
  70009 
  70010 #if defined(__aarch64__) || defined(__arm64ec__)
  70011 #ifdef __LITTLE_ENDIAN__
        /* vmull_high_p64: returns vmull_p64 applied to vget_high_p64(__p0) and
         * vget_high_p64(__p1), each cast to poly64_t. Declared with
         * target("aes,neon"). Little-endian variant: operands are used as-is. */
  70012 __ai __attribute__((target("aes,neon"))) poly128_t vmull_high_p64(poly64x2_t __p0, poly64x2_t __p1) {
  70013   poly128_t __ret;
  70014   __ret = vmull_p64((poly64_t)(vget_high_p64(__p0)), (poly64_t)(vget_high_p64(__p1)));
  70015   return __ret;
  70016 }
  70017 #else
        /* Big-endian variant: both inputs are lane-reversed with
         * __builtin_shufflevector and __noswap_vget_high_p64 extracts from the
         * reversed vectors. The poly128_t result is returned directly, with no
         * final shuffle. */
  70018 __ai __attribute__((target("aes,neon"))) poly128_t vmull_high_p64(poly64x2_t __p0, poly64x2_t __p1) {
  70019   poly128_t __ret;
  70020   poly64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  70021   poly64x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  70022   __ret = vmull_p64((poly64_t)(__noswap_vget_high_p64(__rev0)), (poly64_t)(__noswap_vget_high_p64(__rev1)));
  70023   return __ret;
  70024 }
  70025 #endif
  70026 
  70027 #ifdef __LITTLE_ENDIAN__
        /* vfmlalq_lane_high_f16(acc, a, v, lane): evaluates to
         *   vfmlalq_high_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vget_lane_f16(v, lane). acc is float32x4_t, a is float16x8_t, v is
         * float16x4_t; the result is float32x4_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70028 #define vfmlalq_lane_high_f16(__p0_857, __p1_857, __p2_857, __p3_857) __extension__ ({ \
  70029   float32x4_t __ret_857; \
  70030   float32x4_t __s0_857 = __p0_857; \
  70031   float16x8_t __s1_857 = __p1_857; \
  70032   float16x4_t __s2_857 = __p2_857; \
  70033   __ret_857 = vfmlalq_high_f16(__s0_857, __s1_857, (float16x8_t) {vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857)}); \
  70034   __ret_857; \
  70035 })
  70036 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70037 #define vfmlalq_lane_high_f16(__p0_858, __p1_858, __p2_858, __p3_858) __extension__ ({ \
  70038   float32x4_t __ret_858; \
  70039   float32x4_t __s0_858 = __p0_858; \
  70040   float16x8_t __s1_858 = __p1_858; \
  70041   float16x4_t __s2_858 = __p2_858; \
  70042   float32x4_t __rev0_858;  __rev0_858 = __builtin_shufflevector(__s0_858, __s0_858, 3, 2, 1, 0); \
  70043   float16x8_t __rev1_858;  __rev1_858 = __builtin_shufflevector(__s1_858, __s1_858, 7, 6, 5, 4, 3, 2, 1, 0); \
  70044   float16x4_t __rev2_858;  __rev2_858 = __builtin_shufflevector(__s2_858, __s2_858, 3, 2, 1, 0); \
  70045   __ret_858 = __noswap_vfmlalq_high_f16(__rev0_858, __rev1_858, (float16x8_t) {__noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858)}); \
  70046   __ret_858 = __builtin_shufflevector(__ret_858, __ret_858, 3, 2, 1, 0); \
  70047   __ret_858; \
  70048 })
  70049 #endif
  70050 
  70051 #ifdef __LITTLE_ENDIAN__
        /* vfmlal_lane_high_f16(acc, a, v, lane): evaluates to
         *   vfmlal_high_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vget_lane_f16(v, lane). acc is float32x2_t, a and v are float16x4_t;
         * the result is float32x2_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70052 #define vfmlal_lane_high_f16(__p0_859, __p1_859, __p2_859, __p3_859) __extension__ ({ \
  70053   float32x2_t __ret_859; \
  70054   float32x2_t __s0_859 = __p0_859; \
  70055   float16x4_t __s1_859 = __p1_859; \
  70056   float16x4_t __s2_859 = __p2_859; \
  70057   __ret_859 = vfmlal_high_f16(__s0_859, __s1_859, (float16x4_t) {vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859)}); \
  70058   __ret_859; \
  70059 })
  70060 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70061 #define vfmlal_lane_high_f16(__p0_860, __p1_860, __p2_860, __p3_860) __extension__ ({ \
  70062   float32x2_t __ret_860; \
  70063   float32x2_t __s0_860 = __p0_860; \
  70064   float16x4_t __s1_860 = __p1_860; \
  70065   float16x4_t __s2_860 = __p2_860; \
  70066   float32x2_t __rev0_860;  __rev0_860 = __builtin_shufflevector(__s0_860, __s0_860, 1, 0); \
  70067   float16x4_t __rev1_860;  __rev1_860 = __builtin_shufflevector(__s1_860, __s1_860, 3, 2, 1, 0); \
  70068   float16x4_t __rev2_860;  __rev2_860 = __builtin_shufflevector(__s2_860, __s2_860, 3, 2, 1, 0); \
  70069   __ret_860 = __noswap_vfmlal_high_f16(__rev0_860, __rev1_860, (float16x4_t) {__noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860)}); \
  70070   __ret_860 = __builtin_shufflevector(__ret_860, __ret_860, 1, 0); \
  70071   __ret_860; \
  70072 })
  70073 #endif
  70074 
  70075 #ifdef __LITTLE_ENDIAN__
        /* vfmlalq_lane_low_f16(acc, a, v, lane): evaluates to
         *   vfmlalq_low_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vget_lane_f16(v, lane). acc is float32x4_t, a is float16x8_t, v is
         * float16x4_t; the result is float32x4_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70076 #define vfmlalq_lane_low_f16(__p0_861, __p1_861, __p2_861, __p3_861) __extension__ ({ \
  70077   float32x4_t __ret_861; \
  70078   float32x4_t __s0_861 = __p0_861; \
  70079   float16x8_t __s1_861 = __p1_861; \
  70080   float16x4_t __s2_861 = __p2_861; \
  70081   __ret_861 = vfmlalq_low_f16(__s0_861, __s1_861, (float16x8_t) {vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861)}); \
  70082   __ret_861; \
  70083 })
  70084 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70085 #define vfmlalq_lane_low_f16(__p0_862, __p1_862, __p2_862, __p3_862) __extension__ ({ \
  70086   float32x4_t __ret_862; \
  70087   float32x4_t __s0_862 = __p0_862; \
  70088   float16x8_t __s1_862 = __p1_862; \
  70089   float16x4_t __s2_862 = __p2_862; \
  70090   float32x4_t __rev0_862;  __rev0_862 = __builtin_shufflevector(__s0_862, __s0_862, 3, 2, 1, 0); \
  70091   float16x8_t __rev1_862;  __rev1_862 = __builtin_shufflevector(__s1_862, __s1_862, 7, 6, 5, 4, 3, 2, 1, 0); \
  70092   float16x4_t __rev2_862;  __rev2_862 = __builtin_shufflevector(__s2_862, __s2_862, 3, 2, 1, 0); \
  70093   __ret_862 = __noswap_vfmlalq_low_f16(__rev0_862, __rev1_862, (float16x8_t) {__noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862)}); \
  70094   __ret_862 = __builtin_shufflevector(__ret_862, __ret_862, 3, 2, 1, 0); \
  70095   __ret_862; \
  70096 })
  70097 #endif
  70098 
  70099 #ifdef __LITTLE_ENDIAN__
        /* vfmlal_lane_low_f16(acc, a, v, lane): evaluates to
         *   vfmlal_low_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vget_lane_f16(v, lane). acc is float32x2_t, a and v are float16x4_t;
         * the result is float32x2_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70100 #define vfmlal_lane_low_f16(__p0_863, __p1_863, __p2_863, __p3_863) __extension__ ({ \
  70101   float32x2_t __ret_863; \
  70102   float32x2_t __s0_863 = __p0_863; \
  70103   float16x4_t __s1_863 = __p1_863; \
  70104   float16x4_t __s2_863 = __p2_863; \
  70105   __ret_863 = vfmlal_low_f16(__s0_863, __s1_863, (float16x4_t) {vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863)}); \
  70106   __ret_863; \
  70107 })
  70108 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70109 #define vfmlal_lane_low_f16(__p0_864, __p1_864, __p2_864, __p3_864) __extension__ ({ \
  70110   float32x2_t __ret_864; \
  70111   float32x2_t __s0_864 = __p0_864; \
  70112   float16x4_t __s1_864 = __p1_864; \
  70113   float16x4_t __s2_864 = __p2_864; \
  70114   float32x2_t __rev0_864;  __rev0_864 = __builtin_shufflevector(__s0_864, __s0_864, 1, 0); \
  70115   float16x4_t __rev1_864;  __rev1_864 = __builtin_shufflevector(__s1_864, __s1_864, 3, 2, 1, 0); \
  70116   float16x4_t __rev2_864;  __rev2_864 = __builtin_shufflevector(__s2_864, __s2_864, 3, 2, 1, 0); \
  70117   __ret_864 = __noswap_vfmlal_low_f16(__rev0_864, __rev1_864, (float16x4_t) {__noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864)}); \
  70118   __ret_864 = __builtin_shufflevector(__ret_864, __ret_864, 1, 0); \
  70119   __ret_864; \
  70120 })
  70121 #endif
  70122 
  70123 #ifdef __LITTLE_ENDIAN__
        /* vfmlalq_laneq_high_f16(acc, a, v, lane): evaluates to
         *   vfmlalq_high_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vgetq_lane_f16(v, lane). acc is float32x4_t, a and v are float16x8_t;
         * the result is float32x4_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70124 #define vfmlalq_laneq_high_f16(__p0_865, __p1_865, __p2_865, __p3_865) __extension__ ({ \
  70125   float32x4_t __ret_865; \
  70126   float32x4_t __s0_865 = __p0_865; \
  70127   float16x8_t __s1_865 = __p1_865; \
  70128   float16x8_t __s2_865 = __p2_865; \
  70129   __ret_865 = vfmlalq_high_f16(__s0_865, __s1_865, (float16x8_t) {vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865)}); \
  70130   __ret_865; \
  70131 })
  70132 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70133 #define vfmlalq_laneq_high_f16(__p0_866, __p1_866, __p2_866, __p3_866) __extension__ ({ \
  70134   float32x4_t __ret_866; \
  70135   float32x4_t __s0_866 = __p0_866; \
  70136   float16x8_t __s1_866 = __p1_866; \
  70137   float16x8_t __s2_866 = __p2_866; \
  70138   float32x4_t __rev0_866;  __rev0_866 = __builtin_shufflevector(__s0_866, __s0_866, 3, 2, 1, 0); \
  70139   float16x8_t __rev1_866;  __rev1_866 = __builtin_shufflevector(__s1_866, __s1_866, 7, 6, 5, 4, 3, 2, 1, 0); \
  70140   float16x8_t __rev2_866;  __rev2_866 = __builtin_shufflevector(__s2_866, __s2_866, 7, 6, 5, 4, 3, 2, 1, 0); \
  70141   __ret_866 = __noswap_vfmlalq_high_f16(__rev0_866, __rev1_866, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866)}); \
  70142   __ret_866 = __builtin_shufflevector(__ret_866, __ret_866, 3, 2, 1, 0); \
  70143   __ret_866; \
  70144 })
  70145 #endif
  70146 
  70147 #ifdef __LITTLE_ENDIAN__
        /* vfmlal_laneq_high_f16(acc, a, v, lane): evaluates to
         *   vfmlal_high_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vgetq_lane_f16(v, lane). acc is float32x2_t, a is float16x4_t, v is
         * float16x8_t; the result is float32x2_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70148 #define vfmlal_laneq_high_f16(__p0_867, __p1_867, __p2_867, __p3_867) __extension__ ({ \
  70149   float32x2_t __ret_867; \
  70150   float32x2_t __s0_867 = __p0_867; \
  70151   float16x4_t __s1_867 = __p1_867; \
  70152   float16x8_t __s2_867 = __p2_867; \
  70153   __ret_867 = vfmlal_high_f16(__s0_867, __s1_867, (float16x4_t) {vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867)}); \
  70154   __ret_867; \
  70155 })
  70156 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70157 #define vfmlal_laneq_high_f16(__p0_868, __p1_868, __p2_868, __p3_868) __extension__ ({ \
  70158   float32x2_t __ret_868; \
  70159   float32x2_t __s0_868 = __p0_868; \
  70160   float16x4_t __s1_868 = __p1_868; \
  70161   float16x8_t __s2_868 = __p2_868; \
  70162   float32x2_t __rev0_868;  __rev0_868 = __builtin_shufflevector(__s0_868, __s0_868, 1, 0); \
  70163   float16x4_t __rev1_868;  __rev1_868 = __builtin_shufflevector(__s1_868, __s1_868, 3, 2, 1, 0); \
  70164   float16x8_t __rev2_868;  __rev2_868 = __builtin_shufflevector(__s2_868, __s2_868, 7, 6, 5, 4, 3, 2, 1, 0); \
  70165   __ret_868 = __noswap_vfmlal_high_f16(__rev0_868, __rev1_868, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868)}); \
  70166   __ret_868 = __builtin_shufflevector(__ret_868, __ret_868, 1, 0); \
  70167   __ret_868; \
  70168 })
  70169 #endif
  70170 
  70171 #ifdef __LITTLE_ENDIAN__
        /* vfmlalq_laneq_low_f16(acc, a, v, lane): evaluates to
         *   vfmlalq_low_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vgetq_lane_f16(v, lane). acc is float32x4_t, a and v are float16x8_t;
         * the result is float32x4_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70172 #define vfmlalq_laneq_low_f16(__p0_869, __p1_869, __p2_869, __p3_869) __extension__ ({ \
  70173   float32x4_t __ret_869; \
  70174   float32x4_t __s0_869 = __p0_869; \
  70175   float16x8_t __s1_869 = __p1_869; \
  70176   float16x8_t __s2_869 = __p2_869; \
  70177   __ret_869 = vfmlalq_low_f16(__s0_869, __s1_869, (float16x8_t) {vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869)}); \
  70178   __ret_869; \
  70179 })
  70180 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70181 #define vfmlalq_laneq_low_f16(__p0_870, __p1_870, __p2_870, __p3_870) __extension__ ({ \
  70182   float32x4_t __ret_870; \
  70183   float32x4_t __s0_870 = __p0_870; \
  70184   float16x8_t __s1_870 = __p1_870; \
  70185   float16x8_t __s2_870 = __p2_870; \
  70186   float32x4_t __rev0_870;  __rev0_870 = __builtin_shufflevector(__s0_870, __s0_870, 3, 2, 1, 0); \
  70187   float16x8_t __rev1_870;  __rev1_870 = __builtin_shufflevector(__s1_870, __s1_870, 7, 6, 5, 4, 3, 2, 1, 0); \
  70188   float16x8_t __rev2_870;  __rev2_870 = __builtin_shufflevector(__s2_870, __s2_870, 7, 6, 5, 4, 3, 2, 1, 0); \
  70189   __ret_870 = __noswap_vfmlalq_low_f16(__rev0_870, __rev1_870, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870)}); \
  70190   __ret_870 = __builtin_shufflevector(__ret_870, __ret_870, 3, 2, 1, 0); \
  70191   __ret_870; \
  70192 })
  70193 #endif
  70194 
  70195 #ifdef __LITTLE_ENDIAN__
        /* vfmlal_laneq_low_f16(acc, a, v, lane): evaluates to
         *   vfmlal_low_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vgetq_lane_f16(v, lane). acc is float32x2_t, a is float16x4_t, v is
         * float16x8_t; the result is float32x2_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70196 #define vfmlal_laneq_low_f16(__p0_871, __p1_871, __p2_871, __p3_871) __extension__ ({ \
  70197   float32x2_t __ret_871; \
  70198   float32x2_t __s0_871 = __p0_871; \
  70199   float16x4_t __s1_871 = __p1_871; \
  70200   float16x8_t __s2_871 = __p2_871; \
  70201   __ret_871 = vfmlal_low_f16(__s0_871, __s1_871, (float16x4_t) {vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871)}); \
  70202   __ret_871; \
  70203 })
  70204 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70205 #define vfmlal_laneq_low_f16(__p0_872, __p1_872, __p2_872, __p3_872) __extension__ ({ \
  70206   float32x2_t __ret_872; \
  70207   float32x2_t __s0_872 = __p0_872; \
  70208   float16x4_t __s1_872 = __p1_872; \
  70209   float16x8_t __s2_872 = __p2_872; \
  70210   float32x2_t __rev0_872;  __rev0_872 = __builtin_shufflevector(__s0_872, __s0_872, 1, 0); \
  70211   float16x4_t __rev1_872;  __rev1_872 = __builtin_shufflevector(__s1_872, __s1_872, 3, 2, 1, 0); \
  70212   float16x8_t __rev2_872;  __rev2_872 = __builtin_shufflevector(__s2_872, __s2_872, 7, 6, 5, 4, 3, 2, 1, 0); \
  70213   __ret_872 = __noswap_vfmlal_low_f16(__rev0_872, __rev1_872, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872)}); \
  70214   __ret_872 = __builtin_shufflevector(__ret_872, __ret_872, 1, 0); \
  70215   __ret_872; \
  70216 })
  70217 #endif
  70218 
  70219 #ifdef __LITTLE_ENDIAN__
        /* vfmlslq_lane_high_f16(acc, a, v, lane): evaluates to
         *   vfmlslq_high_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vget_lane_f16(v, lane). acc is float32x4_t, a is float16x8_t, v is
         * float16x4_t; the result is float32x4_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70220 #define vfmlslq_lane_high_f16(__p0_873, __p1_873, __p2_873, __p3_873) __extension__ ({ \
  70221   float32x4_t __ret_873; \
  70222   float32x4_t __s0_873 = __p0_873; \
  70223   float16x8_t __s1_873 = __p1_873; \
  70224   float16x4_t __s2_873 = __p2_873; \
  70225   __ret_873 = vfmlslq_high_f16(__s0_873, __s1_873, (float16x8_t) {vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873)}); \
  70226   __ret_873; \
  70227 })
  70228 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70229 #define vfmlslq_lane_high_f16(__p0_874, __p1_874, __p2_874, __p3_874) __extension__ ({ \
  70230   float32x4_t __ret_874; \
  70231   float32x4_t __s0_874 = __p0_874; \
  70232   float16x8_t __s1_874 = __p1_874; \
  70233   float16x4_t __s2_874 = __p2_874; \
  70234   float32x4_t __rev0_874;  __rev0_874 = __builtin_shufflevector(__s0_874, __s0_874, 3, 2, 1, 0); \
  70235   float16x8_t __rev1_874;  __rev1_874 = __builtin_shufflevector(__s1_874, __s1_874, 7, 6, 5, 4, 3, 2, 1, 0); \
  70236   float16x4_t __rev2_874;  __rev2_874 = __builtin_shufflevector(__s2_874, __s2_874, 3, 2, 1, 0); \
  70237   __ret_874 = __noswap_vfmlslq_high_f16(__rev0_874, __rev1_874, (float16x8_t) {__noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874)}); \
  70238   __ret_874 = __builtin_shufflevector(__ret_874, __ret_874, 3, 2, 1, 0); \
  70239   __ret_874; \
  70240 })
  70241 #endif
  70242 
  70243 #ifdef __LITTLE_ENDIAN__
        /* vfmlsl_lane_high_f16(acc, a, v, lane): evaluates to
         *   vfmlsl_high_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vget_lane_f16(v, lane). acc is float32x2_t, a and v are float16x4_t;
         * the result is float32x2_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70244 #define vfmlsl_lane_high_f16(__p0_875, __p1_875, __p2_875, __p3_875) __extension__ ({ \
  70245   float32x2_t __ret_875; \
  70246   float32x2_t __s0_875 = __p0_875; \
  70247   float16x4_t __s1_875 = __p1_875; \
  70248   float16x4_t __s2_875 = __p2_875; \
  70249   __ret_875 = vfmlsl_high_f16(__s0_875, __s1_875, (float16x4_t) {vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875)}); \
  70250   __ret_875; \
  70251 })
  70252 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70253 #define vfmlsl_lane_high_f16(__p0_876, __p1_876, __p2_876, __p3_876) __extension__ ({ \
  70254   float32x2_t __ret_876; \
  70255   float32x2_t __s0_876 = __p0_876; \
  70256   float16x4_t __s1_876 = __p1_876; \
  70257   float16x4_t __s2_876 = __p2_876; \
  70258   float32x2_t __rev0_876;  __rev0_876 = __builtin_shufflevector(__s0_876, __s0_876, 1, 0); \
  70259   float16x4_t __rev1_876;  __rev1_876 = __builtin_shufflevector(__s1_876, __s1_876, 3, 2, 1, 0); \
  70260   float16x4_t __rev2_876;  __rev2_876 = __builtin_shufflevector(__s2_876, __s2_876, 3, 2, 1, 0); \
  70261   __ret_876 = __noswap_vfmlsl_high_f16(__rev0_876, __rev1_876, (float16x4_t) {__noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876)}); \
  70262   __ret_876 = __builtin_shufflevector(__ret_876, __ret_876, 1, 0); \
  70263   __ret_876; \
  70264 })
  70265 #endif
  70266 
  70267 #ifdef __LITTLE_ENDIAN__
        /* vfmlslq_lane_low_f16(acc, a, v, lane): evaluates to
         *   vfmlslq_low_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vget_lane_f16(v, lane). acc is float32x4_t, a is float16x8_t, v is
         * float16x4_t; the result is float32x4_t. acc, a and v are each copied
         * into a local once; the lane argument is pasted into every element of
         * the literal. Little-endian variant: operands are used as-is. */
  70268 #define vfmlslq_lane_low_f16(__p0_877, __p1_877, __p2_877, __p3_877) __extension__ ({ \
  70269   float32x4_t __ret_877; \
  70270   float32x4_t __s0_877 = __p0_877; \
  70271   float16x8_t __s1_877 = __p1_877; \
  70272   float16x4_t __s2_877 = __p2_877; \
  70273   __ret_877 = vfmlslq_low_f16(__s0_877, __s1_877, (float16x8_t) {vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877)}); \
  70274   __ret_877; \
  70275 })
  70276 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70277 #define vfmlslq_lane_low_f16(__p0_878, __p1_878, __p2_878, __p3_878) __extension__ ({ \
  70278   float32x4_t __ret_878; \
  70279   float32x4_t __s0_878 = __p0_878; \
  70280   float16x8_t __s1_878 = __p1_878; \
  70281   float16x4_t __s2_878 = __p2_878; \
  70282   float32x4_t __rev0_878;  __rev0_878 = __builtin_shufflevector(__s0_878, __s0_878, 3, 2, 1, 0); \
  70283   float16x8_t __rev1_878;  __rev1_878 = __builtin_shufflevector(__s1_878, __s1_878, 7, 6, 5, 4, 3, 2, 1, 0); \
  70284   float16x4_t __rev2_878;  __rev2_878 = __builtin_shufflevector(__s2_878, __s2_878, 3, 2, 1, 0); \
  70285   __ret_878 = __noswap_vfmlslq_low_f16(__rev0_878, __rev1_878, (float16x8_t) {__noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878)}); \
  70286   __ret_878 = __builtin_shufflevector(__ret_878, __ret_878, 3, 2, 1, 0); \
  70287   __ret_878; \
  70288 })
  70289 #endif
  70290 
  70291 #ifdef __LITTLE_ENDIAN__
        /* vfmlsl_lane_low_f16(acc, a, v, lane): evaluates to
         *   vfmlsl_low_f16(acc, a, b)
         * where b is a float16x4_t literal whose four elements are all
         * vget_lane_f16(v, lane). acc is float32x2_t, a and v are float16x4_t;
         * the result is float32x2_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70292 #define vfmlsl_lane_low_f16(__p0_879, __p1_879, __p2_879, __p3_879) __extension__ ({ \
  70293   float32x2_t __ret_879; \
  70294   float32x2_t __s0_879 = __p0_879; \
  70295   float16x4_t __s1_879 = __p1_879; \
  70296   float16x4_t __s2_879 = __p2_879; \
  70297   __ret_879 = vfmlsl_low_f16(__s0_879, __s1_879, (float16x4_t) {vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879)}); \
  70298   __ret_879; \
  70299 })
  70300 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70301 #define vfmlsl_lane_low_f16(__p0_880, __p1_880, __p2_880, __p3_880) __extension__ ({ \
  70302   float32x2_t __ret_880; \
  70303   float32x2_t __s0_880 = __p0_880; \
  70304   float16x4_t __s1_880 = __p1_880; \
  70305   float16x4_t __s2_880 = __p2_880; \
  70306   float32x2_t __rev0_880;  __rev0_880 = __builtin_shufflevector(__s0_880, __s0_880, 1, 0); \
  70307   float16x4_t __rev1_880;  __rev1_880 = __builtin_shufflevector(__s1_880, __s1_880, 3, 2, 1, 0); \
  70308   float16x4_t __rev2_880;  __rev2_880 = __builtin_shufflevector(__s2_880, __s2_880, 3, 2, 1, 0); \
  70309   __ret_880 = __noswap_vfmlsl_low_f16(__rev0_880, __rev1_880, (float16x4_t) {__noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880)}); \
  70310   __ret_880 = __builtin_shufflevector(__ret_880, __ret_880, 1, 0); \
  70311   __ret_880; \
  70312 })
  70313 #endif
  70314 
  70315 #ifdef __LITTLE_ENDIAN__
        /* vfmlslq_laneq_high_f16(acc, a, v, lane): evaluates to
         *   vfmlslq_high_f16(acc, a, b)
         * where b is a float16x8_t literal whose eight elements are all
         * vgetq_lane_f16(v, lane). acc is float32x4_t, a and v are float16x8_t;
         * the result is float32x4_t. acc, a and v are each copied into a local
         * once; the lane argument is pasted into every element of the literal.
         * Little-endian variant: operands are used as-is. */
  70316 #define vfmlslq_laneq_high_f16(__p0_881, __p1_881, __p2_881, __p3_881) __extension__ ({ \
  70317   float32x4_t __ret_881; \
  70318   float32x4_t __s0_881 = __p0_881; \
  70319   float16x8_t __s1_881 = __p1_881; \
  70320   float16x8_t __s2_881 = __p2_881; \
  70321   __ret_881 = vfmlslq_high_f16(__s0_881, __s1_881, (float16x8_t) {vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881)}); \
  70322   __ret_881; \
  70323 })
  70324 #else
        /* Big-endian variant: acc, a and v are lane-reversed with
         * __builtin_shufflevector, the __noswap_ forms of the helpers operate on
         * the reversed vectors, and the result is lane-reversed again before it
         * is yielded. */
  70325 #define vfmlslq_laneq_high_f16(__p0_882, __p1_882, __p2_882, __p3_882) __extension__ ({ \
  70326   float32x4_t __ret_882; \
  70327   float32x4_t __s0_882 = __p0_882; \
  70328   float16x8_t __s1_882 = __p1_882; \
  70329   float16x8_t __s2_882 = __p2_882; \
  70330   float32x4_t __rev0_882;  __rev0_882 = __builtin_shufflevector(__s0_882, __s0_882, 3, 2, 1, 0); \
  70331   float16x8_t __rev1_882;  __rev1_882 = __builtin_shufflevector(__s1_882, __s1_882, 7, 6, 5, 4, 3, 2, 1, 0); \
  70332   float16x8_t __rev2_882;  __rev2_882 = __builtin_shufflevector(__s2_882, __s2_882, 7, 6, 5, 4, 3, 2, 1, 0); \
  70333   __ret_882 = __noswap_vfmlslq_high_f16(__rev0_882, __rev1_882, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882)}); \
  70334   __ret_882 = __builtin_shufflevector(__ret_882, __ret_882, 3, 2, 1, 0); \
  70335   __ret_882; \
  70336 })
  70337 #endif
  70338 
  #ifdef __LITTLE_ENDIAN__
  /* vfmlsl_laneq_high_f16: reads lane __p3 of the float16x8_t __p2, repeats
   * that value in all four lanes of a float16x4_t, and forwards it with
   * __p0 and __p1 to vfmlsl_high_f16. */
  #define vfmlsl_laneq_high_f16(__p0_883, __p1_883, __p2_883, __p3_883) __extension__ ({ \
    float32x2_t __acc_883 = __p0_883; \
    float16x4_t __vn_883 = __p1_883; \
    float16x8_t __vm_883 = __p2_883; \
    float16_t __lane_883 = vgetq_lane_f16(__vm_883, __p3_883); \
    float32x2_t __res_883 = vfmlsl_high_f16(__acc_883, __vn_883, \
        (float16x4_t) {__lane_883, __lane_883, __lane_883, __lane_883}); \
    __res_883; \
  })
  #else
  /* Big-endian form: each vector operand is lane-reversed, the __noswap_
   * helpers run on the reversed copies, and the result is lane-reversed
   * again before it is yielded. */
  #define vfmlsl_laneq_high_f16(__p0_884, __p1_884, __p2_884, __p3_884) __extension__ ({ \
    float32x2_t __acc_884 = __p0_884; \
    float16x4_t __vn_884 = __p1_884; \
    float16x8_t __vm_884 = __p2_884; \
    float32x2_t __racc_884 = __builtin_shufflevector(__acc_884, __acc_884, 1, 0); \
    float16x4_t __rvn_884 = __builtin_shufflevector(__vn_884, __vn_884, 3, 2, 1, 0); \
    float16x8_t __rvm_884 = __builtin_shufflevector(__vm_884, __vm_884, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16_t __lane_884 = __noswap_vgetq_lane_f16(__rvm_884, __p3_884); \
    float32x2_t __res_884 = __noswap_vfmlsl_high_f16(__racc_884, __rvn_884, \
        (float16x4_t) {__lane_884, __lane_884, __lane_884, __lane_884}); \
    __res_884 = __builtin_shufflevector(__res_884, __res_884, 1, 0); \
    __res_884; \
  })
  #endif
  70362 
  #ifdef __LITTLE_ENDIAN__
  /* vfmlslq_laneq_low_f16: reads lane __p3 of the float16x8_t __p2, repeats
   * that value in all eight lanes of a float16x8_t, and forwards it with
   * __p0 and __p1 to vfmlslq_low_f16. */
  #define vfmlslq_laneq_low_f16(__p0_885, __p1_885, __p2_885, __p3_885) __extension__ ({ \
    float32x4_t __acc_885 = __p0_885; \
    float16x8_t __vn_885 = __p1_885; \
    float16x8_t __vm_885 = __p2_885; \
    float16_t __lane_885 = vgetq_lane_f16(__vm_885, __p3_885); \
    float32x4_t __res_885 = vfmlslq_low_f16(__acc_885, __vn_885, \
        (float16x8_t) {__lane_885, __lane_885, __lane_885, __lane_885, \
                       __lane_885, __lane_885, __lane_885, __lane_885}); \
    __res_885; \
  })
  #else
  /* Big-endian form: each vector operand is lane-reversed, the __noswap_
   * helpers run on the reversed copies, and the result is lane-reversed
   * again before it is yielded. */
  #define vfmlslq_laneq_low_f16(__p0_886, __p1_886, __p2_886, __p3_886) __extension__ ({ \
    float32x4_t __acc_886 = __p0_886; \
    float16x8_t __vn_886 = __p1_886; \
    float16x8_t __vm_886 = __p2_886; \
    float32x4_t __racc_886 = __builtin_shufflevector(__acc_886, __acc_886, 3, 2, 1, 0); \
    float16x8_t __rvn_886 = __builtin_shufflevector(__vn_886, __vn_886, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16x8_t __rvm_886 = __builtin_shufflevector(__vm_886, __vm_886, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16_t __lane_886 = __noswap_vgetq_lane_f16(__rvm_886, __p3_886); \
    float32x4_t __res_886 = __noswap_vfmlslq_low_f16(__racc_886, __rvn_886, \
        (float16x8_t) {__lane_886, __lane_886, __lane_886, __lane_886, \
                       __lane_886, __lane_886, __lane_886, __lane_886}); \
    __res_886 = __builtin_shufflevector(__res_886, __res_886, 3, 2, 1, 0); \
    __res_886; \
  })
  #endif
  70386 
  #ifdef __LITTLE_ENDIAN__
  /* vfmlsl_laneq_low_f16: reads lane __p3 of the float16x8_t __p2, repeats
   * that value in all four lanes of a float16x4_t, and forwards it with
   * __p0 and __p1 to vfmlsl_low_f16. */
  #define vfmlsl_laneq_low_f16(__p0_887, __p1_887, __p2_887, __p3_887) __extension__ ({ \
    float32x2_t __acc_887 = __p0_887; \
    float16x4_t __vn_887 = __p1_887; \
    float16x8_t __vm_887 = __p2_887; \
    float16_t __lane_887 = vgetq_lane_f16(__vm_887, __p3_887); \
    float32x2_t __res_887 = vfmlsl_low_f16(__acc_887, __vn_887, \
        (float16x4_t) {__lane_887, __lane_887, __lane_887, __lane_887}); \
    __res_887; \
  })
  #else
  /* Big-endian form: each vector operand is lane-reversed, the __noswap_
   * helpers run on the reversed copies, and the result is lane-reversed
   * again before it is yielded. */
  #define vfmlsl_laneq_low_f16(__p0_888, __p1_888, __p2_888, __p3_888) __extension__ ({ \
    float32x2_t __acc_888 = __p0_888; \
    float16x4_t __vn_888 = __p1_888; \
    float16x8_t __vm_888 = __p2_888; \
    float32x2_t __racc_888 = __builtin_shufflevector(__acc_888, __acc_888, 1, 0); \
    float16x4_t __rvn_888 = __builtin_shufflevector(__vn_888, __vn_888, 3, 2, 1, 0); \
    float16x8_t __rvm_888 = __builtin_shufflevector(__vm_888, __vm_888, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16_t __lane_888 = __noswap_vgetq_lane_f16(__rvm_888, __p3_888); \
    float32x2_t __res_888 = __noswap_vfmlsl_low_f16(__racc_888, __rvn_888, \
        (float16x4_t) {__lane_888, __lane_888, __lane_888, __lane_888}); \
    __res_888 = __builtin_shufflevector(__res_888, __res_888, 1, 0); \
    __res_888; \
  })
  #endif
  70410 
  #ifdef __LITTLE_ENDIAN__
  /* vmulh_lane_f16: multiplies the float16_t __p0 by lane __p2 of the
   * float16x4_t __p1 (read with vget_lane_f16). The product is stored in a
   * float16_t local so the macro yields float16_t. */
  #define vmulh_lane_f16(__p0_889, __p1_889, __p2_889) __extension__ ({ \
    float16_t __scalar_889 = __p0_889; \
    float16x4_t __vec_889 = __p1_889; \
    float16_t __prod_889 = __scalar_889 * vget_lane_f16(__vec_889, __p2_889); \
    __prod_889; \
  })
  #else
  /* Big-endian form: the vector is lane-reversed and the lane is read with
   * __noswap_vget_lane_f16 from the reversed copy. */
  #define vmulh_lane_f16(__p0_890, __p1_890, __p2_890) __extension__ ({ \
    float16_t __scalar_890 = __p0_890; \
    float16x4_t __vec_890 = __p1_890; \
    float16x4_t __rvec_890 = __builtin_shufflevector(__vec_890, __vec_890, 3, 2, 1, 0); \
    float16_t __prod_890 = __scalar_890 * __noswap_vget_lane_f16(__rvec_890, __p2_890); \
    __prod_890; \
  })
  #endif
  70429 
  #ifdef __LITTLE_ENDIAN__
  /* vmulh_laneq_f16: multiplies the float16_t __p0 by lane __p2 of the
   * float16x8_t __p1 (read with vgetq_lane_f16). The product is stored in a
   * float16_t local so the macro yields float16_t. */
  #define vmulh_laneq_f16(__p0_891, __p1_891, __p2_891) __extension__ ({ \
    float16_t __scalar_891 = __p0_891; \
    float16x8_t __vec_891 = __p1_891; \
    float16_t __prod_891 = __scalar_891 * vgetq_lane_f16(__vec_891, __p2_891); \
    __prod_891; \
  })
  #else
  /* Big-endian form: the vector is lane-reversed and the lane is read with
   * __noswap_vgetq_lane_f16 from the reversed copy. */
  #define vmulh_laneq_f16(__p0_892, __p1_892, __p2_892) __extension__ ({ \
    float16_t __scalar_892 = __p0_892; \
    float16x8_t __vec_892 = __p1_892; \
    float16x8_t __rvec_892 = __builtin_shufflevector(__vec_892, __vec_892, 7, 6, 5, 4, 3, 2, 1, 0); \
    float16_t __prod_892 = __scalar_892 * __noswap_vgetq_lane_f16(__rvec_892, __p2_892); \
    __prod_892; \
  })
  #endif
  70448 
  70449 #ifdef __LITTLE_ENDIAN__
  70450 __ai __attribute__((target("neon"))) uint16x8_t vabdl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  70451   uint16x8_t __ret;
  70452   __ret = vabdl_u8(vget_high_u8(__p0), vget_high_u8(__p1));
  70453   return __ret;
  70454 }
  70455 #else
  70456 __ai __attribute__((target("neon"))) uint16x8_t vabdl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  70457   uint16x8_t __ret;
  70458   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70459   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70460   __ret = __noswap_vabdl_u8(__noswap_vget_high_u8(__rev0), __noswap_vget_high_u8(__rev1));
  70461   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70462   return __ret;
  70463 }
  70464 #endif
  70465 
  70466 #ifdef __LITTLE_ENDIAN__
  70467 __ai __attribute__((target("neon"))) uint64x2_t vabdl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  70468   uint64x2_t __ret;
  70469   __ret = vabdl_u32(vget_high_u32(__p0), vget_high_u32(__p1));
  70470   return __ret;
  70471 }
  70472 #else
  70473 __ai __attribute__((target("neon"))) uint64x2_t vabdl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  70474   uint64x2_t __ret;
  70475   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70476   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70477   __ret = __noswap_vabdl_u32(__noswap_vget_high_u32(__rev0), __noswap_vget_high_u32(__rev1));
  70478   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70479   return __ret;
  70480 }
  70481 #endif
  70482 
  70483 #ifdef __LITTLE_ENDIAN__
  70484 __ai __attribute__((target("neon"))) uint32x4_t vabdl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  70485   uint32x4_t __ret;
  70486   __ret = vabdl_u16(vget_high_u16(__p0), vget_high_u16(__p1));
  70487   return __ret;
  70488 }
  70489 #else
  70490 __ai __attribute__((target("neon"))) uint32x4_t vabdl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  70491   uint32x4_t __ret;
  70492   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70493   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70494   __ret = __noswap_vabdl_u16(__noswap_vget_high_u16(__rev0), __noswap_vget_high_u16(__rev1));
  70495   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70496   return __ret;
  70497 }
  70498 #endif
  70499 
  70500 #ifdef __LITTLE_ENDIAN__
  70501 __ai __attribute__((target("neon"))) int16x8_t vabdl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  70502   int16x8_t __ret;
  70503   __ret = vabdl_s8(vget_high_s8(__p0), vget_high_s8(__p1));
  70504   return __ret;
  70505 }
  70506 #else
  70507 __ai __attribute__((target("neon"))) int16x8_t vabdl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  70508   int16x8_t __ret;
  70509   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70510   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70511   __ret = __noswap_vabdl_s8(__noswap_vget_high_s8(__rev0), __noswap_vget_high_s8(__rev1));
  70512   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70513   return __ret;
  70514 }
  70515 #endif
  70516 
  70517 #ifdef __LITTLE_ENDIAN__
  70518 __ai __attribute__((target("neon"))) int64x2_t vabdl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  70519   int64x2_t __ret;
  70520   __ret = vabdl_s32(vget_high_s32(__p0), vget_high_s32(__p1));
  70521   return __ret;
  70522 }
  70523 #else
  70524 __ai __attribute__((target("neon"))) int64x2_t vabdl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  70525   int64x2_t __ret;
  70526   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70527   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70528   __ret = __noswap_vabdl_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1));
  70529   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70530   return __ret;
  70531 }
  70532 #endif
  70533 
  70534 #ifdef __LITTLE_ENDIAN__
  70535 __ai __attribute__((target("neon"))) int32x4_t vabdl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  70536   int32x4_t __ret;
  70537   __ret = vabdl_s16(vget_high_s16(__p0), vget_high_s16(__p1));
  70538   return __ret;
  70539 }
  70540 #else
  70541 __ai __attribute__((target("neon"))) int32x4_t vabdl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  70542   int32x4_t __ret;
  70543   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70544   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70545   __ret = __noswap_vabdl_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1));
  70546   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70547   return __ret;
  70548 }
  70549 #endif
  70550 
  70551 #ifdef __LITTLE_ENDIAN__
  70552 __ai __attribute__((target("neon"))) uint16x8_t vaddl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  70553   uint16x8_t __ret;
  70554   __ret = vmovl_high_u8(__p0) + vmovl_high_u8(__p1);
  70555   return __ret;
  70556 }
  70557 #else
  70558 __ai __attribute__((target("neon"))) uint16x8_t vaddl_high_u8(uint8x16_t __p0, uint8x16_t __p1) {
  70559   uint16x8_t __ret;
  70560   uint8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70561   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70562   __ret = __noswap_vmovl_high_u8(__rev0) + __noswap_vmovl_high_u8(__rev1);
  70563   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70564   return __ret;
  70565 }
  70566 #endif
  70567 
  70568 #ifdef __LITTLE_ENDIAN__
  70569 __ai __attribute__((target("neon"))) uint64x2_t vaddl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  70570   uint64x2_t __ret;
  70571   __ret = vmovl_high_u32(__p0) + vmovl_high_u32(__p1);
  70572   return __ret;
  70573 }
  70574 #else
  70575 __ai __attribute__((target("neon"))) uint64x2_t vaddl_high_u32(uint32x4_t __p0, uint32x4_t __p1) {
  70576   uint64x2_t __ret;
  70577   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70578   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70579   __ret = __noswap_vmovl_high_u32(__rev0) + __noswap_vmovl_high_u32(__rev1);
  70580   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70581   return __ret;
  70582 }
  70583 #endif
  70584 
  70585 #ifdef __LITTLE_ENDIAN__
  70586 __ai __attribute__((target("neon"))) uint32x4_t vaddl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  70587   uint32x4_t __ret;
  70588   __ret = vmovl_high_u16(__p0) + vmovl_high_u16(__p1);
  70589   return __ret;
  70590 }
  70591 #else
  70592 __ai __attribute__((target("neon"))) uint32x4_t vaddl_high_u16(uint16x8_t __p0, uint16x8_t __p1) {
  70593   uint32x4_t __ret;
  70594   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70595   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70596   __ret = __noswap_vmovl_high_u16(__rev0) + __noswap_vmovl_high_u16(__rev1);
  70597   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70598   return __ret;
  70599 }
  70600 #endif
  70601 
  70602 #ifdef __LITTLE_ENDIAN__
  70603 __ai __attribute__((target("neon"))) int16x8_t vaddl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  70604   int16x8_t __ret;
  70605   __ret = vmovl_high_s8(__p0) + vmovl_high_s8(__p1);
  70606   return __ret;
  70607 }
  70608 #else
  70609 __ai __attribute__((target("neon"))) int16x8_t vaddl_high_s8(int8x16_t __p0, int8x16_t __p1) {
  70610   int16x8_t __ret;
  70611   int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70612   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70613   __ret = __noswap_vmovl_high_s8(__rev0) + __noswap_vmovl_high_s8(__rev1);
  70614   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70615   return __ret;
  70616 }
  70617 #endif
  70618 
  70619 #ifdef __LITTLE_ENDIAN__
  70620 __ai __attribute__((target("neon"))) int64x2_t vaddl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  70621   int64x2_t __ret;
  70622   __ret = vmovl_high_s32(__p0) + vmovl_high_s32(__p1);
  70623   return __ret;
  70624 }
  70625 #else
  70626 __ai __attribute__((target("neon"))) int64x2_t vaddl_high_s32(int32x4_t __p0, int32x4_t __p1) {
  70627   int64x2_t __ret;
  70628   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70629   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70630   __ret = __noswap_vmovl_high_s32(__rev0) + __noswap_vmovl_high_s32(__rev1);
  70631   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70632   return __ret;
  70633 }
  70634 #endif
  70635 
  70636 #ifdef __LITTLE_ENDIAN__
  70637 __ai __attribute__((target("neon"))) int32x4_t vaddl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  70638   int32x4_t __ret;
  70639   __ret = vmovl_high_s16(__p0) + vmovl_high_s16(__p1);
  70640   return __ret;
  70641 }
  70642 #else
  70643 __ai __attribute__((target("neon"))) int32x4_t vaddl_high_s16(int16x8_t __p0, int16x8_t __p1) {
  70644   int32x4_t __ret;
  70645   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70646   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70647   __ret = __noswap_vmovl_high_s16(__rev0) + __noswap_vmovl_high_s16(__rev1);
  70648   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70649   return __ret;
  70650 }
  70651 #endif
  70652 
  70653 #ifdef __LITTLE_ENDIAN__
  70654 __ai __attribute__((target("neon"))) uint16x8_t vaddw_high_u8(uint16x8_t __p0, uint8x16_t __p1) {
  70655   uint16x8_t __ret;
  70656   __ret = __p0 + vmovl_high_u8(__p1);
  70657   return __ret;
  70658 }
  70659 #else
  70660 __ai __attribute__((target("neon"))) uint16x8_t vaddw_high_u8(uint16x8_t __p0, uint8x16_t __p1) {
  70661   uint16x8_t __ret;
  70662   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70663   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70664   __ret = __rev0 + __noswap_vmovl_high_u8(__rev1);
  70665   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70666   return __ret;
  70667 }
  70668 #endif
  70669 
  70670 #ifdef __LITTLE_ENDIAN__
  70671 __ai __attribute__((target("neon"))) uint64x2_t vaddw_high_u32(uint64x2_t __p0, uint32x4_t __p1) {
  70672   uint64x2_t __ret;
  70673   __ret = __p0 + vmovl_high_u32(__p1);
  70674   return __ret;
  70675 }
  70676 #else
  70677 __ai __attribute__((target("neon"))) uint64x2_t vaddw_high_u32(uint64x2_t __p0, uint32x4_t __p1) {
  70678   uint64x2_t __ret;
  70679   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  70680   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70681   __ret = __rev0 + __noswap_vmovl_high_u32(__rev1);
  70682   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70683   return __ret;
  70684 }
  70685 #endif
  70686 
  70687 #ifdef __LITTLE_ENDIAN__
  70688 __ai __attribute__((target("neon"))) uint32x4_t vaddw_high_u16(uint32x4_t __p0, uint16x8_t __p1) {
  70689   uint32x4_t __ret;
  70690   __ret = __p0 + vmovl_high_u16(__p1);
  70691   return __ret;
  70692 }
  70693 #else
  70694 __ai __attribute__((target("neon"))) uint32x4_t vaddw_high_u16(uint32x4_t __p0, uint16x8_t __p1) {
  70695   uint32x4_t __ret;
  70696   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70697   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70698   __ret = __rev0 + __noswap_vmovl_high_u16(__rev1);
  70699   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70700   return __ret;
  70701 }
  70702 #endif
  70703 
  70704 #ifdef __LITTLE_ENDIAN__
  70705 __ai __attribute__((target("neon"))) int16x8_t vaddw_high_s8(int16x8_t __p0, int8x16_t __p1) {
  70706   int16x8_t __ret;
  70707   __ret = __p0 + vmovl_high_s8(__p1);
  70708   return __ret;
  70709 }
  70710 #else
  70711 __ai __attribute__((target("neon"))) int16x8_t vaddw_high_s8(int16x8_t __p0, int8x16_t __p1) {
  70712   int16x8_t __ret;
  70713   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70714   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70715   __ret = __rev0 + __noswap_vmovl_high_s8(__rev1);
  70716   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70717   return __ret;
  70718 }
  70719 #endif
  70720 
  70721 #ifdef __LITTLE_ENDIAN__
  70722 __ai __attribute__((target("neon"))) int64x2_t vaddw_high_s32(int64x2_t __p0, int32x4_t __p1) {
  70723   int64x2_t __ret;
  70724   __ret = __p0 + vmovl_high_s32(__p1);
  70725   return __ret;
  70726 }
  70727 #else
  70728 __ai __attribute__((target("neon"))) int64x2_t vaddw_high_s32(int64x2_t __p0, int32x4_t __p1) {
  70729   int64x2_t __ret;
  70730   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  70731   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70732   __ret = __rev0 + __noswap_vmovl_high_s32(__rev1);
  70733   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70734   return __ret;
  70735 }
  70736 #endif
  70737 
  70738 #ifdef __LITTLE_ENDIAN__
  70739 __ai __attribute__((target("neon"))) int32x4_t vaddw_high_s16(int32x4_t __p0, int16x8_t __p1) {
  70740   int32x4_t __ret;
  70741   __ret = __p0 + vmovl_high_s16(__p1);
  70742   return __ret;
  70743 }
  70744 #else
  70745 __ai __attribute__((target("neon"))) int32x4_t vaddw_high_s16(int32x4_t __p0, int16x8_t __p1) {
  70746   int32x4_t __ret;
  70747   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70748   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70749   __ret = __rev0 + __noswap_vmovl_high_s16(__rev1);
  70750   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70751   return __ret;
  70752 }
  70753 #endif
  70754 
  #ifdef __LITTLE_ENDIAN__
  /* vcopyq_lane_p64: hands the value read by vget_lane_p64(__p2, __p3) to
   * vsetq_lane_p64 together with the poly64x2_t __p0 and lane index __p1. */
  #define vcopyq_lane_p64(__p0_893, __p1_893, __p2_893, __p3_893) __extension__ ({ \
    poly64x2_t __dst_893 = __p0_893; \
    poly64x1_t __src_893 = __p2_893; \
    poly64x2_t __res_893 = vsetq_lane_p64(vget_lane_p64(__src_893, __p3_893), __dst_893, __p1_893); \
    __res_893; \
  })
  #else
  /* Big-endian form: the destination vector is lane-reversed, updated with
   * __noswap_vsetq_lane_p64, and lane-reversed again; the one-lane source is
   * used unchanged. */
  #define vcopyq_lane_p64(__p0_894, __p1_894, __p2_894, __p3_894) __extension__ ({ \
    poly64x2_t __dst_894 = __p0_894; \
    poly64x1_t __src_894 = __p2_894; \
    poly64x2_t __rdst_894 = __builtin_shufflevector(__dst_894, __dst_894, 1, 0); \
    poly64x2_t __res_894 = __noswap_vsetq_lane_p64(vget_lane_p64(__src_894, __p3_894), __rdst_894, __p1_894); \
    __res_894 = __builtin_shufflevector(__res_894, __res_894, 1, 0); \
    __res_894; \
  })
  #endif
  70774 
  #ifdef __LITTLE_ENDIAN__
  /* vcopyq_lane_f64: hands the value read by vget_lane_f64(__p2, __p3) to
   * vsetq_lane_f64 together with the float64x2_t __p0 and lane index __p1. */
  #define vcopyq_lane_f64(__p0_895, __p1_895, __p2_895, __p3_895) __extension__ ({ \
    float64x2_t __dst_895 = __p0_895; \
    float64x1_t __src_895 = __p2_895; \
    float64x2_t __res_895 = vsetq_lane_f64(vget_lane_f64(__src_895, __p3_895), __dst_895, __p1_895); \
    __res_895; \
  })
  #else
  /* Big-endian form: the destination vector is lane-reversed, updated with
   * __noswap_vsetq_lane_f64, and lane-reversed again; the one-lane source is
   * used unchanged. */
  #define vcopyq_lane_f64(__p0_896, __p1_896, __p2_896, __p3_896) __extension__ ({ \
    float64x2_t __dst_896 = __p0_896; \
    float64x1_t __src_896 = __p2_896; \
    float64x2_t __rdst_896 = __builtin_shufflevector(__dst_896, __dst_896, 1, 0); \
    float64x2_t __res_896 = __noswap_vsetq_lane_f64(vget_lane_f64(__src_896, __p3_896), __rdst_896, __p1_896); \
    __res_896 = __builtin_shufflevector(__res_896, __res_896, 1, 0); \
    __res_896; \
  })
  #endif
  70794 
  /* vcopy_lane_p64: hands the value read by vget_lane_p64(__p2, __p3) to
   * vset_lane_p64 together with the poly64x1_t __p0 and lane index __p1.
   * There is a single definition with no endianness split. */
  #define vcopy_lane_p64(__p0_897, __p1_897, __p2_897, __p3_897) __extension__ ({ \
    poly64x1_t __dst_897 = __p0_897; \
    poly64x1_t __src_897 = __p2_897; \
    poly64x1_t __res_897 = vset_lane_p64(vget_lane_p64(__src_897, __p3_897), __dst_897, __p1_897); \
    __res_897; \
  })
  /* vcopy_lane_f64: hands the value read by vget_lane_f64(__p2, __p3) to
   * vset_lane_f64 together with the float64x1_t __p0 and lane index __p1.
   * There is a single definition with no endianness split. */
  #define vcopy_lane_f64(__p0_898, __p1_898, __p2_898, __p3_898) __extension__ ({ \
    float64x1_t __dst_898 = __p0_898; \
    float64x1_t __src_898 = __p2_898; \
    float64x1_t __res_898 = vset_lane_f64(vget_lane_f64(__src_898, __p3_898), __dst_898, __p1_898); \
    __res_898; \
  })
  #ifdef __LITTLE_ENDIAN__
  /* vcopyq_laneq_p64: hands the value read by vgetq_lane_p64(__p2, __p3) to
   * vsetq_lane_p64 together with the poly64x2_t __p0 and lane index __p1. */
  #define vcopyq_laneq_p64(__p0_899, __p1_899, __p2_899, __p3_899) __extension__ ({ \
    poly64x2_t __dst_899 = __p0_899; \
    poly64x2_t __src_899 = __p2_899; \
    poly64x2_t __res_899 = vsetq_lane_p64(vgetq_lane_p64(__src_899, __p3_899), __dst_899, __p1_899); \
    __res_899; \
  })
  #else
  /* Big-endian form: both vectors are lane-reversed, the __noswap_ get/set
   * helpers run on the reversed copies, and the result is lane-reversed
   * again. */
  #define vcopyq_laneq_p64(__p0_900, __p1_900, __p2_900, __p3_900) __extension__ ({ \
    poly64x2_t __dst_900 = __p0_900; \
    poly64x2_t __src_900 = __p2_900; \
    poly64x2_t __rdst_900 = __builtin_shufflevector(__dst_900, __dst_900, 1, 0); \
    poly64x2_t __rsrc_900 = __builtin_shufflevector(__src_900, __src_900, 1, 0); \
    poly64x2_t __res_900 = __noswap_vsetq_lane_p64(__noswap_vgetq_lane_p64(__rsrc_900, __p3_900), __rdst_900, __p1_900); \
    __res_900 = __builtin_shufflevector(__res_900, __res_900, 1, 0); \
    __res_900; \
  })
  #endif
  70829 
  #ifdef __LITTLE_ENDIAN__
  /* vcopyq_laneq_f64: hands the value read by vgetq_lane_f64(__p2, __p3) to
   * vsetq_lane_f64 together with the float64x2_t __p0 and lane index __p1. */
  #define vcopyq_laneq_f64(__p0_901, __p1_901, __p2_901, __p3_901) __extension__ ({ \
    float64x2_t __dst_901 = __p0_901; \
    float64x2_t __src_901 = __p2_901; \
    float64x2_t __res_901 = vsetq_lane_f64(vgetq_lane_f64(__src_901, __p3_901), __dst_901, __p1_901); \
    __res_901; \
  })
  #else
  /* Big-endian form: both vectors are lane-reversed, the __noswap_ get/set
   * helpers run on the reversed copies, and the result is lane-reversed
   * again. */
  #define vcopyq_laneq_f64(__p0_902, __p1_902, __p2_902, __p3_902) __extension__ ({ \
    float64x2_t __dst_902 = __p0_902; \
    float64x2_t __src_902 = __p2_902; \
    float64x2_t __rdst_902 = __builtin_shufflevector(__dst_902, __dst_902, 1, 0); \
    float64x2_t __rsrc_902 = __builtin_shufflevector(__src_902, __src_902, 1, 0); \
    float64x2_t __res_902 = __noswap_vsetq_lane_f64(__noswap_vgetq_lane_f64(__rsrc_902, __p3_902), __rdst_902, __p1_902); \
    __res_902 = __builtin_shufflevector(__res_902, __res_902, 1, 0); \
    __res_902; \
  })
  #endif
  70850 
  #ifdef __LITTLE_ENDIAN__
  /* vcopy_laneq_p64: hands the value read by vgetq_lane_p64(__p2, __p3) to
   * vset_lane_p64 together with the poly64x1_t __p0 and lane index __p1. */
  #define vcopy_laneq_p64(__p0_903, __p1_903, __p2_903, __p3_903) __extension__ ({ \
    poly64x1_t __dst_903 = __p0_903; \
    poly64x2_t __src_903 = __p2_903; \
    poly64x1_t __res_903 = vset_lane_p64(vgetq_lane_p64(__src_903, __p3_903), __dst_903, __p1_903); \
    __res_903; \
  })
  #else
  /* Big-endian form: only the two-lane source is lane-reversed and read with
   * __noswap_vgetq_lane_p64; the one-lane destination and the result are
   * not shuffled. */
  #define vcopy_laneq_p64(__p0_904, __p1_904, __p2_904, __p3_904) __extension__ ({ \
    poly64x1_t __dst_904 = __p0_904; \
    poly64x2_t __src_904 = __p2_904; \
    poly64x2_t __rsrc_904 = __builtin_shufflevector(__src_904, __src_904, 1, 0); \
    poly64x1_t __res_904 = vset_lane_p64(__noswap_vgetq_lane_p64(__rsrc_904, __p3_904), __dst_904, __p1_904); \
    __res_904; \
  })
  #endif
  70869 
  #ifdef __LITTLE_ENDIAN__
  /* vcopy_laneq_f64: hands the value read by vgetq_lane_f64(__p2, __p3) to
   * vset_lane_f64 together with the float64x1_t __p0 and lane index __p1. */
  #define vcopy_laneq_f64(__p0_905, __p1_905, __p2_905, __p3_905) __extension__ ({ \
    float64x1_t __dst_905 = __p0_905; \
    float64x2_t __src_905 = __p2_905; \
    float64x1_t __res_905 = vset_lane_f64(vgetq_lane_f64(__src_905, __p3_905), __dst_905, __p1_905); \
    __res_905; \
  })
  #else
  /* Big-endian form: only the two-lane source is lane-reversed and read with
   * __noswap_vgetq_lane_f64; the one-lane destination and the result are
   * not shuffled. */
  #define vcopy_laneq_f64(__p0_906, __p1_906, __p2_906, __p3_906) __extension__ ({ \
    float64x1_t __dst_906 = __p0_906; \
    float64x2_t __src_906 = __p2_906; \
    float64x2_t __rsrc_906 = __builtin_shufflevector(__src_906, __src_906, 1, 0); \
    float64x1_t __res_906 = vset_lane_f64(__noswap_vgetq_lane_f64(__rsrc_906, __p3_906), __dst_906, __p1_906); \
    __res_906; \
  })
  #endif
  70888 
  70889 #ifdef __LITTLE_ENDIAN__
  70890 __ai __attribute__((target("neon"))) uint16x8_t vmlal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  70891   uint16x8_t __ret;
  70892   __ret = vmlal_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2));
  70893   return __ret;
  70894 }
  70895 #else
  70896 __ai __attribute__((target("neon"))) uint16x8_t vmlal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  70897   uint16x8_t __ret;
  70898   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70899   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70900   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70901   __ret = __noswap_vmlal_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2));
  70902   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70903   return __ret;
  70904 }
  70905 #endif
  70906 
  70907 #ifdef __LITTLE_ENDIAN__
  70908 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  70909   uint64x2_t __ret;
  70910   __ret = vmlal_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2));
  70911   return __ret;
  70912 }
  70913 #else
  70914 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  70915   uint64x2_t __ret;
  70916   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  70917   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70918   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  70919   __ret = __noswap_vmlal_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2));
  70920   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70921   return __ret;
  70922 }
  70923 #endif
  70924 
  70925 #ifdef __LITTLE_ENDIAN__
  70926 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  70927   uint32x4_t __ret;
  70928   __ret = vmlal_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2));
  70929   return __ret;
  70930 }
  70931 #else
  70932 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  70933   uint32x4_t __ret;
  70934   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70935   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70936   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  70937   __ret = __noswap_vmlal_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2));
  70938   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70939   return __ret;
  70940 }
  70941 #endif
  70942 
  70943 #ifdef __LITTLE_ENDIAN__
  70944 __ai __attribute__((target("neon"))) int16x8_t vmlal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  70945   int16x8_t __ret;
  70946   __ret = vmlal_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2));
  70947   return __ret;
  70948 }
  70949 #else
  70950 __ai __attribute__((target("neon"))) int16x8_t vmlal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  70951   int16x8_t __ret;
  70952   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  70953   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70954   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  70955   __ret = __noswap_vmlal_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2));
  70956   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  70957   return __ret;
  70958 }
  70959 #endif
  70960 
  70961 #ifdef __LITTLE_ENDIAN__
  70962 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  70963   int64x2_t __ret;
  70964   __ret = vmlal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2));
  70965   return __ret;
  70966 }
  70967 #else
  70968 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  70969   int64x2_t __ret;
  70970   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  70971   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  70972   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  70973   __ret = __noswap_vmlal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2));
  70974   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  70975   return __ret;
  70976 }
  70977 #endif
  70978 
  70979 #ifdef __LITTLE_ENDIAN__
  70980 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  70981   int32x4_t __ret;
  70982   __ret = vmlal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2));
  70983   return __ret;
  70984 }
  70985 #else
  70986 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  70987   int32x4_t __ret;
  70988   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  70989   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  70990   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  70991   __ret = __noswap_vmlal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2));
  70992   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  70993   return __ret;
  70994 }
  70995 #endif
  70996 
  70997 #ifdef __LITTLE_ENDIAN__
  70998 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) {
  70999   uint64x2_t __ret;
  71000   __ret = vmlal_n_u32(__p0, vget_high_u32(__p1), __p2);
  71001   return __ret;
  71002 }
  71003 #else
  71004 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) {
  71005   uint64x2_t __ret;
  71006   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71007   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71008   __ret = __noswap_vmlal_n_u32(__rev0, __noswap_vget_high_u32(__rev1), __p2);
  71009   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71010   return __ret;
  71011 }
  71012 #endif
  71013 
  71014 #ifdef __LITTLE_ENDIAN__
  71015 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) {
  71016   uint32x4_t __ret;
  71017   __ret = vmlal_n_u16(__p0, vget_high_u16(__p1), __p2);
  71018   return __ret;
  71019 }
  71020 #else
  71021 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) {
  71022   uint32x4_t __ret;
  71023   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71024   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71025   __ret = __noswap_vmlal_n_u16(__rev0, __noswap_vget_high_u16(__rev1), __p2);
  71026   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71027   return __ret;
  71028 }
  71029 #endif
  71030 
  71031 #ifdef __LITTLE_ENDIAN__
  71032 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  71033   int64x2_t __ret;
  71034   __ret = vmlal_n_s32(__p0, vget_high_s32(__p1), __p2);
  71035   return __ret;
  71036 }
  71037 #else
  71038 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  71039   int64x2_t __ret;
  71040   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71041   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71042   __ret = __noswap_vmlal_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2);
  71043   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71044   return __ret;
  71045 }
  71046 #endif
  71047 
  71048 #ifdef __LITTLE_ENDIAN__
  71049 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  71050   int32x4_t __ret;
  71051   __ret = vmlal_n_s16(__p0, vget_high_s16(__p1), __p2);
  71052   return __ret;
  71053 }
  71054 #else
  71055 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  71056   int32x4_t __ret;
  71057   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71058   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71059   __ret = __noswap_vmlal_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2);
  71060   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71061   return __ret;
  71062 }
  71063 #endif
  71064 
  71065 #ifdef __LITTLE_ENDIAN__
  71066 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  71067   uint16x8_t __ret;
  71068   __ret = vmlsl_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2));
  71069   return __ret;
  71070 }
  71071 #else
  71072 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  71073   uint16x8_t __ret;
  71074   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71075   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71076   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71077   __ret = __noswap_vmlsl_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2));
  71078   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71079   return __ret;
  71080 }
  71081 #endif
  71082 
  71083 #ifdef __LITTLE_ENDIAN__
  71084 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  71085   uint64x2_t __ret;
  71086   __ret = vmlsl_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2));
  71087   return __ret;
  71088 }
  71089 #else
  71090 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  71091   uint64x2_t __ret;
  71092   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71093   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71094   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71095   __ret = __noswap_vmlsl_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2));
  71096   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71097   return __ret;
  71098 }
  71099 #endif
  71100 
  71101 #ifdef __LITTLE_ENDIAN__
  71102 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  71103   uint32x4_t __ret;
  71104   __ret = vmlsl_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2));
  71105   return __ret;
  71106 }
  71107 #else
  71108 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  71109   uint32x4_t __ret;
  71110   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71111   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71112   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71113   __ret = __noswap_vmlsl_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2));
  71114   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71115   return __ret;
  71116 }
  71117 #endif
  71118 
  71119 #ifdef __LITTLE_ENDIAN__
  71120 __ai __attribute__((target("neon"))) int16x8_t vmlsl_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  71121   int16x8_t __ret;
  71122   __ret = vmlsl_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2));
  71123   return __ret;
  71124 }
  71125 #else
  71126 __ai __attribute__((target("neon"))) int16x8_t vmlsl_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  71127   int16x8_t __ret;
  71128   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71129   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71130   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71131   __ret = __noswap_vmlsl_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2));
  71132   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71133   return __ret;
  71134 }
  71135 #endif
  71136 
  71137 #ifdef __LITTLE_ENDIAN__
  71138 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  71139   int64x2_t __ret;
  71140   __ret = vmlsl_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2));
  71141   return __ret;
  71142 }
  71143 #else
  71144 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  71145   int64x2_t __ret;
  71146   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71147   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71148   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71149   __ret = __noswap_vmlsl_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2));
  71150   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71151   return __ret;
  71152 }
  71153 #endif
  71154 
  71155 #ifdef __LITTLE_ENDIAN__
  71156 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  71157   int32x4_t __ret;
  71158   __ret = vmlsl_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2));
  71159   return __ret;
  71160 }
  71161 #else
  71162 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  71163   int32x4_t __ret;
  71164   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71165   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71166   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71167   __ret = __noswap_vmlsl_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2));
  71168   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71169   return __ret;
  71170 }
  71171 #endif
  71172 
  71173 #ifdef __LITTLE_ENDIAN__
  71174 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) {
  71175   uint64x2_t __ret;
  71176   __ret = vmlsl_n_u32(__p0, vget_high_u32(__p1), __p2);
  71177   return __ret;
  71178 }
  71179 #else
  71180 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) {
  71181   uint64x2_t __ret;
  71182   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71183   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71184   __ret = __noswap_vmlsl_n_u32(__rev0, __noswap_vget_high_u32(__rev1), __p2);
  71185   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71186   return __ret;
  71187 }
  71188 #endif
  71189 
  71190 #ifdef __LITTLE_ENDIAN__
  71191 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) {
  71192   uint32x4_t __ret;
  71193   __ret = vmlsl_n_u16(__p0, vget_high_u16(__p1), __p2);
  71194   return __ret;
  71195 }
  71196 #else
  71197 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) {
  71198   uint32x4_t __ret;
  71199   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71200   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71201   __ret = __noswap_vmlsl_n_u16(__rev0, __noswap_vget_high_u16(__rev1), __p2);
  71202   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71203   return __ret;
  71204 }
  71205 #endif
  71206 
  71207 #ifdef __LITTLE_ENDIAN__
  71208 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  71209   int64x2_t __ret;
  71210   __ret = vmlsl_n_s32(__p0, vget_high_s32(__p1), __p2);
  71211   return __ret;
  71212 }
  71213 #else
  71214 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) {
  71215   int64x2_t __ret;
  71216   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71217   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71218   __ret = __noswap_vmlsl_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2);
  71219   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71220   return __ret;
  71221 }
  71222 #endif
  71223 
  71224 #ifdef __LITTLE_ENDIAN__
  71225 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  71226   int32x4_t __ret;
  71227   __ret = vmlsl_n_s16(__p0, vget_high_s16(__p1), __p2);
  71228   return __ret;
  71229 }
  71230 #else
  71231 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) {
  71232   int32x4_t __ret;
  71233   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71234   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71235   __ret = __noswap_vmlsl_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2);
  71236   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71237   return __ret;
  71238 }
  71239 #endif
  71240 
  71241 #define vmulx_lane_f64(__p0_907, __p1_907, __p2_907) __extension__ ({ \
  71242   float64x1_t __ret_907; \
  71243   float64x1_t __s0_907 = __p0_907; \
  71244   float64x1_t __s1_907 = __p1_907; \
  71245   float64_t __x_907 = vget_lane_f64(__s0_907, 0); \
  71246   float64_t __y_907 = vget_lane_f64(__s1_907, __p2_907); \
  71247   float64_t __z_907 = vmulxd_f64(__x_907, __y_907); \
  71248   __ret_907 = vset_lane_f64(__z_907, __s0_907, __p2_907); \
  71249   __ret_907; \
  71250 })
  71251 #ifdef __LITTLE_ENDIAN__
  71252 #define vmulx_laneq_f64(__p0_908, __p1_908, __p2_908) __extension__ ({ \
  71253   float64x1_t __ret_908; \
  71254   float64x1_t __s0_908 = __p0_908; \
  71255   float64x2_t __s1_908 = __p1_908; \
  71256   float64_t __x_908 = vget_lane_f64(__s0_908, 0); \
  71257   float64_t __y_908 = vgetq_lane_f64(__s1_908, __p2_908); \
  71258   float64_t __z_908 = vmulxd_f64(__x_908, __y_908); \
  71259   __ret_908 = vset_lane_f64(__z_908, __s0_908, 0); \
  71260   __ret_908; \
  71261 })
  71262 #else
  71263 #define vmulx_laneq_f64(__p0_909, __p1_909, __p2_909) __extension__ ({ \
  71264   float64x1_t __ret_909; \
  71265   float64x1_t __s0_909 = __p0_909; \
  71266   float64x2_t __s1_909 = __p1_909; \
  71267   float64x2_t __rev1_909;  __rev1_909 = __builtin_shufflevector(__s1_909, __s1_909, 1, 0); \
  71268   float64_t __x_909 = vget_lane_f64(__s0_909, 0); \
  71269   float64_t __y_909 = __noswap_vgetq_lane_f64(__rev1_909, __p2_909); \
  71270   float64_t __z_909 = vmulxd_f64(__x_909, __y_909); \
  71271   __ret_909 = vset_lane_f64(__z_909, __s0_909, 0); \
  71272   __ret_909; \
  71273 })
  71274 #endif
  71275 
  71276 #endif
  71277 #ifdef __LITTLE_ENDIAN__
  71278 __ai __attribute__((target("neon"))) uint16x8_t vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  71279   uint16x8_t __ret;
  71280   __ret = __p0 + vabdl_u8(__p1, __p2);
  71281   return __ret;
  71282 }
  71283 #else
  71284 __ai __attribute__((target("neon"))) uint16x8_t vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  71285   uint16x8_t __ret;
  71286   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71287   uint8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71288   uint8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71289   __ret = __rev0 + __noswap_vabdl_u8(__rev1, __rev2);
  71290   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71291   return __ret;
  71292 }
  71293 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  71294   uint16x8_t __ret;
  71295   __ret = __p0 + __noswap_vabdl_u8(__p1, __p2);
  71296   return __ret;
  71297 }
  71298 #endif
  71299 
  71300 #ifdef __LITTLE_ENDIAN__
  71301 __ai __attribute__((target("neon"))) uint64x2_t vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  71302   uint64x2_t __ret;
  71303   __ret = __p0 + vabdl_u32(__p1, __p2);
  71304   return __ret;
  71305 }
  71306 #else
  71307 __ai __attribute__((target("neon"))) uint64x2_t vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  71308   uint64x2_t __ret;
  71309   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71310   uint32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  71311   uint32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  71312   __ret = __rev0 + __noswap_vabdl_u32(__rev1, __rev2);
  71313   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71314   return __ret;
  71315 }
  71316 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) {
  71317   uint64x2_t __ret;
  71318   __ret = __p0 + __noswap_vabdl_u32(__p1, __p2);
  71319   return __ret;
  71320 }
  71321 #endif
  71322 
  71323 #ifdef __LITTLE_ENDIAN__
  71324 __ai __attribute__((target("neon"))) uint32x4_t vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  71325   uint32x4_t __ret;
  71326   __ret = __p0 + vabdl_u16(__p1, __p2);
  71327   return __ret;
  71328 }
  71329 #else
  71330 __ai __attribute__((target("neon"))) uint32x4_t vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  71331   uint32x4_t __ret;
  71332   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71333   uint16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71334   uint16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71335   __ret = __rev0 + __noswap_vabdl_u16(__rev1, __rev2);
  71336   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71337   return __ret;
  71338 }
  71339 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) {
  71340   uint32x4_t __ret;
  71341   __ret = __p0 + __noswap_vabdl_u16(__p1, __p2);
  71342   return __ret;
  71343 }
  71344 #endif
  71345 
  71346 #ifdef __LITTLE_ENDIAN__
  71347 __ai __attribute__((target("neon"))) int16x8_t vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  71348   int16x8_t __ret;
  71349   __ret = __p0 + vabdl_s8(__p1, __p2);
  71350   return __ret;
  71351 }
  71352 #else
  71353 __ai __attribute__((target("neon"))) int16x8_t vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  71354   int16x8_t __ret;
  71355   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71356   int8x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71357   int8x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71358   __ret = __rev0 + __noswap_vabdl_s8(__rev1, __rev2);
  71359   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71360   return __ret;
  71361 }
  71362 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) {
  71363   int16x8_t __ret;
  71364   __ret = __p0 + __noswap_vabdl_s8(__p1, __p2);
  71365   return __ret;
  71366 }
  71367 #endif
  71368 
  71369 #ifdef __LITTLE_ENDIAN__
  71370 __ai __attribute__((target("neon"))) int64x2_t vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  71371   int64x2_t __ret;
  71372   __ret = __p0 + vabdl_s32(__p1, __p2);
  71373   return __ret;
  71374 }
  71375 #else
  71376 __ai __attribute__((target("neon"))) int64x2_t vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  71377   int64x2_t __ret;
  71378   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71379   int32x2_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0);
  71380   int32x2_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0);
  71381   __ret = __rev0 + __noswap_vabdl_s32(__rev1, __rev2);
  71382   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71383   return __ret;
  71384 }
  71385 __ai __attribute__((target("neon"))) int64x2_t __noswap_vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) {
  71386   int64x2_t __ret;
  71387   __ret = __p0 + __noswap_vabdl_s32(__p1, __p2);
  71388   return __ret;
  71389 }
  71390 #endif
  71391 
  71392 #ifdef __LITTLE_ENDIAN__
  71393 __ai __attribute__((target("neon"))) int32x4_t vabal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  71394   int32x4_t __ret;
  71395   __ret = __p0 + vabdl_s16(__p1, __p2);
  71396   return __ret;
  71397 }
  71398 #else
  71399 __ai __attribute__((target("neon"))) int32x4_t vabal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  71400   int32x4_t __ret;
  71401   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71402   int16x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71403   int16x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71404   __ret = __rev0 + __noswap_vabdl_s16(__rev1, __rev2);
  71405   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71406   return __ret;
  71407 }
  71408 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) {
  71409   int32x4_t __ret;
  71410   __ret = __p0 + __noswap_vabdl_s16(__p1, __p2);
  71411   return __ret;
  71412 }
  71413 #endif
  71414 
  71415 #if defined(__aarch64__) || defined(__arm64ec__)
  71416 #ifdef __LITTLE_ENDIAN__
  71417 __ai __attribute__((target("neon"))) uint16x8_t vabal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  71418   uint16x8_t __ret;
  71419   __ret = vabal_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2));
  71420   return __ret;
  71421 }
  71422 #else
  71423 __ai __attribute__((target("neon"))) uint16x8_t vabal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  71424   uint16x8_t __ret;
  71425   uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71426   uint8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71427   uint8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71428   __ret = __noswap_vabal_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2));
  71429   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71430   return __ret;
  71431 }
  71432 #endif
  71433 
  71434 #ifdef __LITTLE_ENDIAN__
  71435 __ai __attribute__((target("neon"))) uint64x2_t vabal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  71436   uint64x2_t __ret;
  71437   __ret = vabal_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2));
  71438   return __ret;
  71439 }
  71440 #else
  71441 __ai __attribute__((target("neon"))) uint64x2_t vabal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) {
  71442   uint64x2_t __ret;
  71443   uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71444   uint32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71445   uint32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71446   __ret = __noswap_vabal_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2));
  71447   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71448   return __ret;
  71449 }
  71450 #endif
  71451 
  71452 #ifdef __LITTLE_ENDIAN__
  71453 __ai __attribute__((target("neon"))) uint32x4_t vabal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  71454   uint32x4_t __ret;
  71455   __ret = vabal_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2));
  71456   return __ret;
  71457 }
  71458 #else
  71459 __ai __attribute__((target("neon"))) uint32x4_t vabal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) {
  71460   uint32x4_t __ret;
  71461   uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71462   uint16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71463   uint16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71464   __ret = __noswap_vabal_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2));
  71465   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71466   return __ret;
  71467 }
  71468 #endif
  71469 
  71470 #ifdef __LITTLE_ENDIAN__
  71471 __ai __attribute__((target("neon"))) int16x8_t vabal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  71472   int16x8_t __ret;
  71473   __ret = vabal_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2));
  71474   return __ret;
  71475 }
  71476 #else
  71477 __ai __attribute__((target("neon"))) int16x8_t vabal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) {
  71478   int16x8_t __ret;
  71479   int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  71480   int8x16_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71481   int8x16_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  71482   __ret = __noswap_vabal_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2));
  71483   __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0);
  71484   return __ret;
  71485 }
  71486 #endif
  71487 
  71488 #ifdef __LITTLE_ENDIAN__
  71489 __ai __attribute__((target("neon"))) int64x2_t vabal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  71490   int64x2_t __ret;
  71491   __ret = vabal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2));
  71492   return __ret;
  71493 }
  71494 #else
  71495 __ai __attribute__((target("neon"))) int64x2_t vabal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) {
  71496   int64x2_t __ret;
  71497   int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  71498   int32x4_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  71499   int32x4_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0);
  71500   __ret = __noswap_vabal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2));
  71501   __ret = __builtin_shufflevector(__ret, __ret, 1, 0);
  71502   return __ret;
  71503 }
  71504 #endif
  71505 
  71506 #ifdef __LITTLE_ENDIAN__
  71507 __ai __attribute__((target("neon"))) int32x4_t vabal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  71508   int32x4_t __ret;
  71509   __ret = vabal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2));
  71510   return __ret;
  71511 }
  71512 #else
  71513 __ai __attribute__((target("neon"))) int32x4_t vabal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) {
  71514   int32x4_t __ret;
  71515   int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  71516   int16x8_t __rev1;  __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  71517   int16x8_t __rev2;  __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  71518   __ret = __noswap_vabal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2));
  71519   __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0);
  71520   return __ret;
  71521 }
  71522 #endif
  71523 
  71524 #endif
  71525 
  71526 #undef __ai
  71527 
#endif /* ifndef __ARM_FP (#else branch) */
#endif /* ifndef __ARM_NEON_H */