/* GNU compiler vector extension intrinsics
   Copyright (C) 2015-2022 Free Software Foundation, Inc.
   Contributed by Andreas Krebbel (Andreas.Krebbel@de.ibm.com)

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

#ifndef _VECINTRIN_H
#define _VECINTRIN_H

/* Class-selection mask bits.  Within this header they are OR-ed
   together and handed to __builtin_s390_vec_fp_test_data_class as its
   second argument.  Each class owns two adjacent bits, suffixed _P and
   _N (presumably the positive and negative sign variants -- confirm
   against the instruction description); the unsuffixed name is the OR
   of both.  */
#define __VEC_CLASS_FP_ZERO_P (1 << 11)
#define __VEC_CLASS_FP_ZERO_N (1 << 10)
#define __VEC_CLASS_FP_ZERO \
  (__VEC_CLASS_FP_ZERO_P | __VEC_CLASS_FP_ZERO_N)

#define __VEC_CLASS_FP_NORMAL_P (1 << 9)
#define __VEC_CLASS_FP_NORMAL_N (1 << 8)
#define __VEC_CLASS_FP_NORMAL \
  (__VEC_CLASS_FP_NORMAL_P | __VEC_CLASS_FP_NORMAL_N)

#define __VEC_CLASS_FP_SUBNORMAL_P (1 << 7)
#define __VEC_CLASS_FP_SUBNORMAL_N (1 << 6)
#define __VEC_CLASS_FP_SUBNORMAL \
  (__VEC_CLASS_FP_SUBNORMAL_P | __VEC_CLASS_FP_SUBNORMAL_N)

#define __VEC_CLASS_FP_INFINITY_P (1 << 5)
#define __VEC_CLASS_FP_INFINITY_N (1 << 4)
#define __VEC_CLASS_FP_INFINITY \
  (__VEC_CLASS_FP_INFINITY_P | __VEC_CLASS_FP_INFINITY_N)

#define __VEC_CLASS_FP_QNAN_P (1 << 3)
#define __VEC_CLASS_FP_QNAN_N (1 << 2)
#define __VEC_CLASS_FP_QNAN \
  (__VEC_CLASS_FP_QNAN_P | __VEC_CLASS_FP_QNAN_N)

#define __VEC_CLASS_FP_SNAN_P (1 << 1)
#define __VEC_CLASS_FP_SNAN_N (1 << 0)
#define __VEC_CLASS_FP_SNAN \
  (__VEC_CLASS_FP_SNAN_P | __VEC_CLASS_FP_SNAN_N)

/* Either kind of NaN, either _P/_N variant.  */
#define __VEC_CLASS_FP_NAN \
  (__VEC_CLASS_FP_QNAN | __VEC_CLASS_FP_SNAN)

/* Every class bit defined above except the two NORMAL bits.  */
#define __VEC_CLASS_FP_NOT_NORMAL \
  (__VEC_CLASS_FP_NAN               \
   | __VEC_CLASS_FP_SUBNORMAL       \
   | __VEC_CLASS_FP_ZERO            \
   | __VEC_CLASS_FP_INFINITY)

/* vec_step must also accept a type name as its parameter, so a plain
   alias to __builtin_vec_step is not enough.  The argument is passed
   through __typeof__ and the builtin is handed the dereference of a
   null pointer cast to that type, which is an expression in both
   cases.  NOTE(review): this relies on the builtin using only the
   type of that operand and never evaluating it -- confirm.  */
#define vec_step(x) __builtin_vec_step (* (__typeof__ (x) *) 0)

/* Call __builtin_s390_lcbb on PTR with the code that corresponds to
   the boundary BNDRY and return the builtin's result.

   BNDRY must be one of 64, 128, 256, 512, 1024, 2048 or 4096; these
   map to the codes 0 through 6 respectively.  For any other value the
   builtin is not invoked and 0 is returned.

   Each case passes its code as a literal rather than through a local
   variable.  NOTE(review): the builtin presumably needs a
   compile-time constant for this operand -- confirm against the GCC
   builtin documentation.  */
static inline int
__lcbb (const void *ptr, int bndry)
{
  switch (bndry)
    {
    case 64:
      return __builtin_s390_lcbb (ptr, 0);
    case 128:
      return __builtin_s390_lcbb (ptr, 1);
    case 256:
      return __builtin_s390_lcbb (ptr, 2);
    case 512:
      return __builtin_s390_lcbb (ptr, 3);
    case 1024:
      return __builtin_s390_lcbb (ptr, 4);
    case 2048:
      return __builtin_s390_lcbb (ptr, 5);
    case 4096:
      return __builtin_s390_lcbb (ptr, 6);
    default:
      /* Unsupported boundary.  */
      return 0;
    }
}

/* "Not less (or equal)" predicates, expressed through the "not
   greater (or equal)" predicates with the operands exchanged.  */
#define vec_all_nle(X, Y) vec_all_nge ((Y), (X))
#define vec_all_nlt(X, Y) vec_all_ngt ((Y), (X))
#define vec_any_nle(X, Y) vec_any_nge ((Y), (X))
#define vec_any_nlt(X, Y) vec_any_ngt ((Y), (X))

/* Plain renames onto builtins.  */
#define vec_genmask __builtin_s390_vgbm
#define vec_genmasks_8 __builtin_s390_vgmb
#define vec_genmasks_16 __builtin_s390_vgmh
#define vec_genmasks_32 __builtin_s390_vgmf
#define vec_genmasks_64 __builtin_s390_vgmg
#define vec_splat_u8 __builtin_s390_vec_splat_u8
#define vec_splat_s8 __builtin_s390_vec_splat_s8
#define vec_splat_u16 __builtin_s390_vec_splat_u16
#define vec_splat_s16 __builtin_s390_vec_splat_s16
#define vec_splat_u32 __builtin_s390_vec_splat_u32
#define vec_splat_s32 __builtin_s390_vec_splat_s32
#define vec_splat_u64 __builtin_s390_vec_splat_u64
#define vec_splat_s64 __builtin_s390_vec_splat_s64
#define vec_checksum __builtin_s390_vcksm
#define vec_gfmsum_128 __builtin_s390_vgfmg
#define vec_gfmsum_accum_128 __builtin_s390_vgfmag

/* Rounding helpers: all go through __builtin_s390_vfi and differ only
   in the two trailing constants.  Names that share the same constants
   (ceil/roundp, floor/roundm, trunc/roundz) are synonyms.
   NOTE(review): the two constants presumably select the
   inexact-suppression control and the rounding mode -- confirm
   against the builtin documentation.  */
#define vec_ceil(X) __builtin_s390_vfi((X), 4, 6)
#define vec_roundp(X) __builtin_s390_vfi((X), 4, 6)
#define vec_floor(X) __builtin_s390_vfi((X), 4, 7)
#define vec_roundm(X) __builtin_s390_vfi((X), 4, 7)
#define vec_trunc(X) __builtin_s390_vfi((X), 4, 5)
#define vec_roundz(X) __builtin_s390_vfi((X), 4, 5)
#define vec_rint(X) __builtin_s390_vfi((X), 0, 0)
#define vec_roundc(X) __builtin_s390_vfi((X), 4, 0)
#define vec_round(X) __builtin_s390_vfi((X), 4, 4)

#define vec_doublee(X) __builtin_s390_vflls((X))
#define vec_floate(X) __builtin_s390_vflrd((X), 0, 0)

/* Note the operand order: the builtins take the length L first.  The
   load form is wrapped in an outer pair of parentheses so that a
   postfix operator written after the macro call applies to the cast
   result and not to the builtin call alone.  */
#define vec_load_len_r(X,L) \
  ((__vector unsigned char)__builtin_s390_vlrlr((L),(X)))
#define vec_store_len_r(X,Y,L) \
  __builtin_s390_vstrlr((__vector signed char)(X),(L),(Y))

/* Evaluate to 1 when __builtin_s390_vec_fp_test_data_class, applied to
   A with the mask of all four NaN class bits (quiet and signalling,
   _P and _N), stores 0 through its third argument; otherwise 0.
   NOTE(review): a stored value of 0 presumably means that every
   element matched the mask -- confirm against the instruction
   description.  */
#define vec_all_nan(a)                                                  \
  __extension__ ({                                                      \
      int __cc;                                                         \
      __builtin_s390_vec_fp_test_data_class ((a), __VEC_CLASS_FP_NAN,   \
                                             &__cc);                    \
      __cc == 0 ? 1 : 0;                                                \
    })

/* Evaluate to 1 when __builtin_s390_vec_fp_test_data_class, applied to
   A with the NORMAL and SUBNORMAL class bits (both _P and _N), stores
   0 through its third argument; otherwise 0.
   NOTE(review): the mask contains neither the ZERO nor the INFINITY
   bits, so such elements are not counted as "numeric" here -- confirm
   that this is intended.  */
#define vec_all_numeric(a)                                              \
  __extension__ ({                                                      \
      int __cc;                                                         \
      __builtin_s390_vec_fp_test_data_class ((a),                       \
                                             __VEC_CLASS_FP_NORMAL      \
                                             | __VEC_CLASS_FP_SUBNORMAL, \
                                             &__cc);                    \
      __cc == 0 ? 1 : 0;                                                \
    })

/* Evaluate to 1 unless __builtin_s390_vec_fp_test_data_class, applied
   to A with the mask of all four NaN class bits, stores 3 through its
   third argument; in that case evaluate to 0.
   NOTE(review): a stored value of 3 presumably means that no element
   matched the mask -- confirm against the instruction description.

   The result is received in the macro-local __cc.  The builtin must be
   handed &__cc, not the address of some identifier `cc' that happens
   to be visible at the point of use.  */
#define vec_any_nan(a)                                                  \
  __extension__ ({                                                      \
      int __cc;                                                         \
      __builtin_s390_vec_fp_test_data_class ((a), __VEC_CLASS_FP_NAN,   \
                                             &__cc);                    \
      __cc != 3 ? 1 : 0;                                                \
    })

/* Evaluate to 1 unless __builtin_s390_vec_fp_test_data_class, applied
   to A with the NORMAL and SUBNORMAL class bits (both _P and _N),
   stores 3 through its third argument; in that case evaluate to 0.
   NOTE(review): the mask contains neither the ZERO nor the INFINITY
   bits -- confirm that this is intended.

   The result is received in the macro-local __cc.  The builtin must be
   handed &__cc, not the address of some identifier `cc' that happens
   to be visible at the point of use.  */
#define vec_any_numeric(a)                                              \
  __extension__ ({                                                      \
      int __cc;                                                         \
      __builtin_s390_vec_fp_test_data_class ((a),                       \
                                             __VEC_CLASS_FP_NORMAL      \
                                             | __VEC_CLASS_FP_SUBNORMAL, \
                                             &__cc);                    \
      __cc != 3 ? 1 : 0;                                                \
    })

/* Each vec_vstbr* name is an alias for the vec_vlbr* name with the
   same suffix.  The vec_vlbr* names themselves are not defined in
   this part of the header.  */
#define vec_vstbrh vec_vlbrh
#define vec_vstbrf vec_vlbrf
#define vec_vstbrg vec_vlbrg
#define vec_vstbrq vec_vlbrq
#define vec_vstbrf_flt vec_vlbrf_flt
#define vec_vstbrg_dbl vec_vlbrg_dbl

/* Likewise, each vec_vster* name is an alias for the vec_vler* name
   with the same suffix.  The f and g variants must not fall back to
   the h variant.  */
#define vec_vsterb vec_vlerb
#define vec_vsterh vec_vlerh
#define vec_vsterf vec_vlerf
#define vec_vsterg vec_vlerg
#define vec_vsterf_flt vec_vlerf_flt
#define vec_vsterg_dbl vec_vlerg_dbl

/* Everything from here to the end of the header is a plain rename of
   a public vec_* name onto a __builtin_s390_* builtin.  No arguments
   are reordered or added.  */

/* Names whose builtin is not simply the vec_* name with a
   __builtin_s390_ prefix.  */
#define vec_extend_to_fp32_hi __builtin_s390_vclfnhs
#define vec_extend_to_fp32_lo __builtin_s390_vclfnls
#define vec_round_from_fp32 __builtin_s390_vcrnfs
#define vec_convert_to_fp16 __builtin_s390_vcfn
#define vec_convert_from_fp16 __builtin_s390_vcnf

/* From here on: vec_NAME -> __builtin_s390_vec_NAME.  */
#define vec_gather_element __builtin_s390_vec_gather_element
#define vec_xl __builtin_s390_vec_xl
#define vec_xld2 __builtin_s390_vec_xld2
#define vec_xlw4 __builtin_s390_vec_xlw4
#define vec_splats __builtin_s390_vec_splats
#define vec_insert __builtin_s390_vec_insert
#define vec_promote __builtin_s390_vec_promote
#define vec_extract __builtin_s390_vec_extract
#define vec_insert_and_zero __builtin_s390_vec_insert_and_zero
#define vec_load_bndry __builtin_s390_vec_load_bndry
#define vec_load_pair __builtin_s390_vec_load_pair
#define vec_load_len __builtin_s390_vec_load_len
#define vec_mergeh __builtin_s390_vec_mergeh
#define vec_mergel __builtin_s390_vec_mergel
#define vec_pack __builtin_s390_vec_pack
#define vec_packs __builtin_s390_vec_packs
#define vec_packs_cc __builtin_s390_vec_packs_cc
#define vec_packsu __builtin_s390_vec_packsu
#define vec_packsu_cc __builtin_s390_vec_packsu_cc
#define vec_perm __builtin_s390_vec_perm
#define vec_permi __builtin_s390_vec_permi
#define vec_splat __builtin_s390_vec_splat
#define vec_scatter_element __builtin_s390_vec_scatter_element
#define vec_sel __builtin_s390_vec_sel
#define vec_extend_s64 __builtin_s390_vec_extend_s64
#define vec_xst __builtin_s390_vec_xst
#define vec_xstd2 __builtin_s390_vec_xstd2
#define vec_xstw4 __builtin_s390_vec_xstw4
#define vec_store_len __builtin_s390_vec_store_len
#define vec_bperm_u128 __builtin_s390_vec_bperm_u128
#define vec_unpackh __builtin_s390_vec_unpackh
#define vec_unpackl __builtin_s390_vec_unpackl
#define vec_addc __builtin_s390_vec_addc
#define vec_add_u128 __builtin_s390_vec_add_u128
#define vec_addc_u128 __builtin_s390_vec_addc_u128
#define vec_adde_u128 __builtin_s390_vec_adde_u128
#define vec_addec_u128 __builtin_s390_vec_addec_u128
#define vec_and __builtin_s390_vec_and
#define vec_andc __builtin_s390_vec_andc
#define vec_avg __builtin_s390_vec_avg
#define vec_all_eq __builtin_s390_vec_all_eq
#define vec_all_ne __builtin_s390_vec_all_ne
#define vec_all_ge __builtin_s390_vec_all_ge
#define vec_all_gt __builtin_s390_vec_all_gt
#define vec_all_le __builtin_s390_vec_all_le
#define vec_all_lt __builtin_s390_vec_all_lt
#define vec_any_eq __builtin_s390_vec_any_eq
#define vec_any_ne __builtin_s390_vec_any_ne
#define vec_any_ge __builtin_s390_vec_any_ge
#define vec_any_gt __builtin_s390_vec_any_gt
#define vec_any_le __builtin_s390_vec_any_le
#define vec_any_lt __builtin_s390_vec_any_lt
#define vec_cmpeq __builtin_s390_vec_cmpeq
#define vec_cmpge __builtin_s390_vec_cmpge
#define vec_cmpgt __builtin_s390_vec_cmpgt
#define vec_cmple __builtin_s390_vec_cmple
#define vec_cmplt __builtin_s390_vec_cmplt
#define vec_cntlz __builtin_s390_vec_cntlz
#define vec_cnttz __builtin_s390_vec_cnttz
#define vec_xor __builtin_s390_vec_xor
#define vec_gfmsum __builtin_s390_vec_gfmsum
#define vec_gfmsum_accum __builtin_s390_vec_gfmsum_accum
#define vec_abs __builtin_s390_vec_abs
#define vec_max __builtin_s390_vec_max
#define vec_min __builtin_s390_vec_min
#define vec_mladd __builtin_s390_vec_mladd
#define vec_mhadd __builtin_s390_vec_mhadd
#define vec_meadd __builtin_s390_vec_meadd
#define vec_moadd __builtin_s390_vec_moadd
#define vec_mulh __builtin_s390_vec_mulh
#define vec_mule __builtin_s390_vec_mule
#define vec_mulo __builtin_s390_vec_mulo
#define vec_nor __builtin_s390_vec_nor
#define vec_or __builtin_s390_vec_or
#define vec_popcnt __builtin_s390_vec_popcnt
#define vec_rl __builtin_s390_vec_rl
#define vec_rli __builtin_s390_vec_rli
#define vec_rl_mask __builtin_s390_vec_rl_mask
#define vec_sll __builtin_s390_vec_sll
#define vec_slb __builtin_s390_vec_slb
#define vec_sld __builtin_s390_vec_sld
#define vec_sldw __builtin_s390_vec_sldw
#define vec_sral __builtin_s390_vec_sral
#define vec_srab __builtin_s390_vec_srab
#define vec_srl __builtin_s390_vec_srl
#define vec_srb __builtin_s390_vec_srb
#define vec_subc __builtin_s390_vec_subc
#define vec_sub_u128 __builtin_s390_vec_sub_u128
#define vec_subc_u128 __builtin_s390_vec_subc_u128
#define vec_sube_u128 __builtin_s390_vec_sube_u128
#define vec_subec_u128 __builtin_s390_vec_subec_u128
#define vec_sum2 __builtin_s390_vec_sum2
#define vec_sum_u128 __builtin_s390_vec_sum_u128
#define vec_sum4 __builtin_s390_vec_sum4
#define vec_test_mask __builtin_s390_vec_test_mask
#define vec_msum_u128 __builtin_s390_vec_msum_u128
#define vec_eqv __builtin_s390_vec_eqv
#define vec_nand __builtin_s390_vec_nand
#define vec_orc __builtin_s390_vec_orc

/* Element search and compare-with-index names.  */
#define vec_find_any_eq_idx __builtin_s390_vec_find_any_eq_idx
#define vec_find_any_ne_idx __builtin_s390_vec_find_any_ne_idx
#define vec_find_any_eq_or_0_idx __builtin_s390_vec_find_any_eq_or_0_idx
#define vec_find_any_ne_or_0_idx __builtin_s390_vec_find_any_ne_or_0_idx
#define vec_find_any_eq __builtin_s390_vec_find_any_eq
#define vec_find_any_ne __builtin_s390_vec_find_any_ne
#define vec_find_any_eq_idx_cc __builtin_s390_vec_find_any_eq_idx_cc
#define vec_find_any_ne_idx_cc __builtin_s390_vec_find_any_ne_idx_cc
#define vec_find_any_eq_or_0_idx_cc __builtin_s390_vec_find_any_eq_or_0_idx_cc
#define vec_find_any_ne_or_0_idx_cc __builtin_s390_vec_find_any_ne_or_0_idx_cc
#define vec_find_any_eq_cc __builtin_s390_vec_find_any_eq_cc
#define vec_find_any_ne_cc __builtin_s390_vec_find_any_ne_cc
#define vec_cmpeq_idx __builtin_s390_vec_cmpeq_idx
#define vec_cmpeq_or_0_idx __builtin_s390_vec_cmpeq_or_0_idx
#define vec_cmpeq_idx_cc __builtin_s390_vec_cmpeq_idx_cc
#define vec_cmpeq_or_0_idx_cc __builtin_s390_vec_cmpeq_or_0_idx_cc
#define vec_cmpne_idx __builtin_s390_vec_cmpne_idx
#define vec_cmpne_or_0_idx __builtin_s390_vec_cmpne_or_0_idx
#define vec_cmpne_idx_cc __builtin_s390_vec_cmpne_idx_cc
#define vec_cmpne_or_0_idx_cc __builtin_s390_vec_cmpne_or_0_idx_cc
#define vec_cp_until_zero __builtin_s390_vec_cp_until_zero
#define vec_cp_until_zero_cc __builtin_s390_vec_cp_until_zero_cc
#define vec_cmprg_idx __builtin_s390_vec_cmprg_idx
#define vec_cmpnrg_idx __builtin_s390_vec_cmpnrg_idx
#define vec_cmprg_or_0_idx __builtin_s390_vec_cmprg_or_0_idx
#define vec_cmpnrg_or_0_idx __builtin_s390_vec_cmpnrg_or_0_idx
#define vec_cmprg __builtin_s390_vec_cmprg
#define vec_cmpnrg __builtin_s390_vec_cmpnrg
#define vec_cmprg_idx_cc __builtin_s390_vec_cmprg_idx_cc
#define vec_cmpnrg_idx_cc __builtin_s390_vec_cmpnrg_idx_cc
#define vec_cmprg_or_0_idx_cc __builtin_s390_vec_cmprg_or_0_idx_cc
#define vec_cmpnrg_or_0_idx_cc __builtin_s390_vec_cmpnrg_or_0_idx_cc
#define vec_cmprg_cc __builtin_s390_vec_cmprg_cc
#define vec_cmpnrg_cc __builtin_s390_vec_cmpnrg_cc

/* Targets of the vec_{all,any}_{nle,nlt} wrapper macros defined
   earlier in this header.  */
#define vec_all_nge __builtin_s390_vec_all_nge
#define vec_all_ngt __builtin_s390_vec_all_ngt
#define vec_any_nge __builtin_s390_vec_any_nge
#define vec_any_ngt __builtin_s390_vec_any_ngt

/* Conversions, fused multiply forms and remaining names.  */
#define vec_ctd __builtin_s390_vec_ctd
#define vec_ctd_s64 __builtin_s390_vec_ctd_s64
#define vec_ctd_u64 __builtin_s390_vec_ctd_u64
#define vec_ctsl __builtin_s390_vec_ctsl
#define vec_ctul __builtin_s390_vec_ctul
#define vec_float __builtin_s390_vec_float
#define vec_double __builtin_s390_vec_double
#define vec_signed __builtin_s390_vec_signed
#define vec_unsigned __builtin_s390_vec_unsigned
#define vec_ld2f __builtin_s390_vec_ld2f
#define vec_st2f __builtin_s390_vec_st2f
#define vec_madd __builtin_s390_vec_madd
#define vec_msub __builtin_s390_vec_msub
#define vec_nmadd __builtin_s390_vec_nmadd
#define vec_nmsub __builtin_s390_vec_nmsub
#define vec_nabs __builtin_s390_vec_nabs
#define vec_sqrt __builtin_s390_vec_sqrt
#define vec_fp_test_data_class __builtin_s390_vec_fp_test_data_class
#define vec_revb __builtin_s390_vec_revb
#define vec_reve __builtin_s390_vec_reve
#define vec_sldb __builtin_s390_vec_sldb
#define vec_srdb __builtin_s390_vec_srdb
#define vec_search_string_cc __builtin_s390_vec_search_string_cc
#define vec_search_string_until_zero_cc __builtin_s390_vec_search_string_until_zero_cc
#endif /* _VECINTRIN_H */