@@ -223,7 +223,7 @@ def __builtin_amdgcn_alignbit : AMDGPUBuiltin<"unsigned int(unsigned int, unsign
223223def __builtin_amdgcn_alignbyte : AMDGPUBuiltin<" unsigned int(unsigned int, unsigned int, unsigned int)" , [Const]>;
224224def __builtin_amdgcn_ubfe : AMDGPUBuiltin<" unsigned int(unsigned int, unsigned int, unsigned int)" , [Const]>;
225225def __builtin_amdgcn_sbfe : AMDGPUBuiltin<" unsigned int(unsigned int, unsigned int, unsigned int)" , [Const]>;
// Changed pair: only the element type of cvt_pkrtz's 2-element return vector
// differs (_Float16 -> __fp16); the (float, float) parameters and the [Const]
// attribute are the same on both sides.
// NOTE(review): the reason for preferring __fp16 is not visible in this excerpt.
226- def __builtin_amdgcn_cvt_pkrtz : AMDGPUBuiltin<" _ExtVector<2, _Float16 >(float, float)" , [Const]>;
226+ def __builtin_amdgcn_cvt_pkrtz : AMDGPUBuiltin<" _ExtVector<2, __fp16 >(float, float)" , [Const]>;
227227def __builtin_amdgcn_cvt_pknorm_i16 : AMDGPUBuiltin<" _ExtVector<2, short>(float, float)" , [Const], " cvt-pknorm-vop2-insts" >;
228228def __builtin_amdgcn_cvt_pknorm_u16 : AMDGPUBuiltin<" _ExtVector<2, unsigned short>(float, float)" , [Const], " cvt-pknorm-vop2-insts" >;
229229def __builtin_amdgcn_cvt_pk_i16 : AMDGPUBuiltin<" _ExtVector<2, short>(int, int)" , [Const]>;
@@ -319,7 +319,7 @@ def __builtin_amdgcn_ds_gws_sema_release_all : AMDGPUBuiltin<"void(unsigned int)
319319// Interpolation builtins.
320320// ===----------------------------------------------------------------------===//
321321def __builtin_amdgcn_interp_p1_f16 : AMDGPUBuiltin<" float(float, unsigned int, unsigned int, bool, unsigned int)" , [Const]>;
// Changed pair: interp_p2_f16's scalar return type goes from _Float16 to
// __fp16; its six parameters and the [Const] attribute are untouched.
// interp_p1_f16 above returns float and is not part of the change.
322- def __builtin_amdgcn_interp_p2_f16 : AMDGPUBuiltin<" _Float16 (float, float, unsigned int, unsigned int, bool, unsigned int)" , [Const]>;
322+ def __builtin_amdgcn_interp_p2_f16 : AMDGPUBuiltin<" __fp16 (float, float, unsigned int, unsigned int, bool, unsigned int)" , [Const]>;
323323def __builtin_amdgcn_interp_p1 : AMDGPUBuiltin<" float(float, unsigned int, unsigned int, unsigned int)" , [Const]>;
324324def __builtin_amdgcn_interp_p2 : AMDGPUBuiltin<" float(float, float, unsigned int, unsigned int, unsigned int)" , [Const]>;
325325def __builtin_amdgcn_interp_mov : AMDGPUBuiltin<" float(unsigned int, unsigned int, unsigned int, unsigned int)" , [Const]>;
@@ -349,7 +349,7 @@ def __builtin_amdgcn_perm : AMDGPUBuiltin<"unsigned int(unsigned int, unsigned i
349349// GFX9+ only builtins.
350350// ===----------------------------------------------------------------------===//
351351
// Changed pair: fmed3h's return type and all three parameter types switch
// from _Float16 to __fp16; the [Const] attribute and the "gfx9-insts"
// feature string are identical on both sides.
352- def __builtin_amdgcn_fmed3h : AMDGPUBuiltin<" _Float16(_Float16, _Float16, _Float16 )" , [Const], " gfx9-insts" >;
352+ def __builtin_amdgcn_fmed3h : AMDGPUBuiltin<" __fp16(__fp16, __fp16, __fp16 )" , [Const], " gfx9-insts" >;
353353
354354def __builtin_amdgcn_global_atomic_fadd_f64 : AMDGPUBuiltin<" double(double address_space<1> *, double)" , [], " gfx90a-insts" >;
355355def __builtin_amdgcn_global_atomic_fadd_f32 : AMDGPUBuiltin<" float(float address_space<1> *, float)" , [], " atomic-fadd-rtn-insts" >;
@@ -669,7 +669,7 @@ def __builtin_amdgcn_ds_read_tr4_b64_v2i32 : AMDGPUBuiltin<"_ExtVector<2, int>(_
669669def __builtin_amdgcn_ds_read_tr6_b96_v3i32 : AMDGPUBuiltin<" _ExtVector<3, int>(_ExtVector<3, int> address_space<3> *)" , [Const], " gfx950-insts" >;
670670def __builtin_amdgcn_ds_read_tr8_b64_v2i32 : AMDGPUBuiltin<" _ExtVector<2, int>(_ExtVector<2, int> address_space<3> *)" , [Const], " gfx950-insts" >;
671671def __builtin_amdgcn_ds_read_tr16_b64_v4i16 : AMDGPUBuiltin<" _ExtVector<4, short>(_ExtVector<4, short> address_space<3> *)" , [Const], " gfx950-insts" >;
// Changed pair: the 4-element vector element type of ds_read_tr16_b64_v4f16
// changes from _Float16 to __fp16 in both the return type and the
// address_space<3> pointer parameter; attribute and feature string are kept.
// The neighbouring short and __bf16 variants are context lines only.
672- def __builtin_amdgcn_ds_read_tr16_b64_v4f16 : AMDGPUBuiltin<" _ExtVector<4, _Float16 >(_ExtVector<4, _Float16 > address_space<3> *)" , [Const], " gfx950-insts" >;
672+ def __builtin_amdgcn_ds_read_tr16_b64_v4f16 : AMDGPUBuiltin<" _ExtVector<4, __fp16 >(_ExtVector<4, __fp16 > address_space<3> *)" , [Const], " gfx950-insts" >;
673673def __builtin_amdgcn_ds_read_tr16_b64_v4bf16 : AMDGPUBuiltin<" _ExtVector<4, __bf16>(_ExtVector<4, __bf16> address_space<3> *)" , [Const], " gfx950-insts" >;
674674
675675def __builtin_amdgcn_ashr_pk_i8_i32 : AMDGPUBuiltin<" unsigned short(unsigned int, unsigned int, unsigned int)" , [Const], " ashr-pk-insts" >;
@@ -699,11 +699,11 @@ def __builtin_amdgcn_s_buffer_prefetch_data : AMDGPUBuiltin<"void(__amdgpu_buffe
699699
700700def __builtin_amdgcn_global_load_tr_b64_v2i32 : AMDGPUBuiltin<" _ExtVector<2, int>(_ExtVector<2, int> address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize32" >;
701701def __builtin_amdgcn_global_load_tr_b128_v8i16 : AMDGPUBuiltin<" _ExtVector<8, short>(_ExtVector<8, short> address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize32" >;
// Changed pair (wavefrontsize32 variant): the 8-element vector element type
// changes from _Float16 to __fp16 in both the return type and the
// address_space<1> pointer parameter; nothing else on the line differs.
702- def __builtin_amdgcn_global_load_tr_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, _Float16 >(_ExtVector<8, _Float16 > address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize32" >;
702+ def __builtin_amdgcn_global_load_tr_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, __fp16 >(_ExtVector<8, __fp16 > address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize32" >;
703703def __builtin_amdgcn_global_load_tr_b128_v8bf16 : AMDGPUBuiltin<" _ExtVector<8, __bf16>(_ExtVector<8, __bf16> address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize32" >;
704704def __builtin_amdgcn_global_load_tr_b64_i32 : AMDGPUBuiltin<" int(int address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize64" >;
705705def __builtin_amdgcn_global_load_tr_b128_v4i16 : AMDGPUBuiltin<" _ExtVector<4, short>(_ExtVector<4, short> address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize64" >;
// Changed pair (wavefrontsize64 variant): same _Float16 -> __fp16 element
// type substitution, here on the 4-element vector form.
706- def __builtin_amdgcn_global_load_tr_b128_v4f16 : AMDGPUBuiltin<" _ExtVector<4, _Float16 >(_ExtVector<4, _Float16 > address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize64" >;
706+ def __builtin_amdgcn_global_load_tr_b128_v4f16 : AMDGPUBuiltin<" _ExtVector<4, __fp16 >(_ExtVector<4, __fp16 > address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize64" >;
707707def __builtin_amdgcn_global_load_tr_b128_v4bf16 : AMDGPUBuiltin<" _ExtVector<4, __bf16>(_ExtVector<4, __bf16> address_space<1> *)" , [Const], " gfx12-insts,wavefrontsize64" >;
708708
709709def __builtin_amdgcn_ds_bpermute_fi_b32 : AMDGPUBuiltin<" int(int, int)" , [Const], " gfx12-insts" >;
@@ -828,9 +828,9 @@ def __builtin_amdgcn_wmma_i32_16x16x32_iu4_w64_gfx12 : AMDGPUBuiltin<"_ExtVector
828828 let ArgNames = [" a_sign" , " a" , " b_sign" , " b" , " c" , " clamp" ];
829829}
830830
// Changed pair: in swmmac_f32_16x16x32_f16_w32 the two half-precision vector
// parameters (8- and 16-element) change element type from _Float16 to __fp16;
// the float result vector, float vector parameter and trailing int stay as-is.
831- def __builtin_amdgcn_swmmac_f32_16x16x32_f16_w32 : AMDGPUBuiltin<" _ExtVector<8, float>(_ExtVector<8, _Float16 >, _ExtVector<16, _Float16 >, _ExtVector<8, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
831+ def __builtin_amdgcn_swmmac_f32_16x16x32_f16_w32 : AMDGPUBuiltin<" _ExtVector<8, float>(_ExtVector<8, __fp16 >, _ExtVector<16, __fp16 >, _ExtVector<8, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
832832def __builtin_amdgcn_swmmac_f32_16x16x32_bf16_w32 : AMDGPUBuiltin<" _ExtVector<8, float>(_ExtVector<8, short>, _ExtVector<16, short>, _ExtVector<8, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
// Changed pair: in swmmac_f16_16x16x32_f16_w32 every _Float16 vector (the
// return type and the three vector parameters) becomes an __fp16 vector of
// the same length; the trailing int parameter is unchanged.
833- def __builtin_amdgcn_swmmac_f16_16x16x32_f16_w32 : AMDGPUBuiltin<" _ExtVector<8, _Float16 >(_ExtVector<8, _Float16 >, _ExtVector<16, _Float16 >, _ExtVector<8, _Float16 >, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
833+ def __builtin_amdgcn_swmmac_f16_16x16x32_f16_w32 : AMDGPUBuiltin<" _ExtVector<8, __fp16 >(_ExtVector<8, __fp16 >, _ExtVector<16, __fp16 >, _ExtVector<8, __fp16 >, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
834834def __builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w32 : AMDGPUBuiltin<" _ExtVector<8, short>(_ExtVector<8, short>, _ExtVector<16, short>, _ExtVector<8, short>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
835835def __builtin_amdgcn_swmmac_i32_16x16x32_iu8_w32 : AMDGPUBuiltin<" _ExtVector<8, int>(_Constant bool, _ExtVector<2, int>, _Constant bool, _ExtVector<4, int>, _ExtVector<8, int>, int, _Constant bool)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
836836def __builtin_amdgcn_swmmac_i32_16x16x32_iu4_w32 : AMDGPUBuiltin<" _ExtVector<8, int>(_Constant bool, int, _Constant bool, _ExtVector<2, int>, _ExtVector<8, int>, int, _Constant bool)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
@@ -840,9 +840,9 @@ def __builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w32 : AMDGPUBuiltin<"_ExtVector
840840def __builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w32 : AMDGPUBuiltin<" _ExtVector<8, float>(_ExtVector<2, int>, _ExtVector<4, int>, _ExtVector<8, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
841841def __builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w32 : AMDGPUBuiltin<" _ExtVector<8, float>(_ExtVector<2, int>, _ExtVector<4, int>, _ExtVector<8, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize32" >;
842842
// Changed pair: in swmmac_f32_16x16x32_f16_w64 the two half-precision vector
// parameters (4- and 8-element) change element type from _Float16 to __fp16;
// the float result vector, float vector parameter and trailing int stay as-is.
843- def __builtin_amdgcn_swmmac_f32_16x16x32_f16_w64 : AMDGPUBuiltin<" _ExtVector<4, float>(_ExtVector<4, _Float16 >, _ExtVector<8, _Float16 >, _ExtVector<4, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
843+ def __builtin_amdgcn_swmmac_f32_16x16x32_f16_w64 : AMDGPUBuiltin<" _ExtVector<4, float>(_ExtVector<4, __fp16 >, _ExtVector<8, __fp16 >, _ExtVector<4, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
844844def __builtin_amdgcn_swmmac_f32_16x16x32_bf16_w64 : AMDGPUBuiltin<" _ExtVector<4, float>(_ExtVector<4, short>, _ExtVector<8, short>, _ExtVector<4, float>, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
// Changed pair: in swmmac_f16_16x16x32_f16_w64 every _Float16 vector (the
// return type and the three vector parameters) becomes an __fp16 vector of
// the same length; the trailing int parameter is unchanged.
845- def __builtin_amdgcn_swmmac_f16_16x16x32_f16_w64 : AMDGPUBuiltin<" _ExtVector<4, _Float16 >(_ExtVector<4, _Float16 >, _ExtVector<8, _Float16 >, _ExtVector<4, _Float16 >, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
845+ def __builtin_amdgcn_swmmac_f16_16x16x32_f16_w64 : AMDGPUBuiltin<" _ExtVector<4, __fp16 >(_ExtVector<4, __fp16 >, _ExtVector<8, __fp16 >, _ExtVector<4, __fp16 >, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
846846def __builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w64 : AMDGPUBuiltin<" _ExtVector<4, short>(_ExtVector<4, short>, _ExtVector<8, short>, _ExtVector<4, short>, int)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
847847def __builtin_amdgcn_swmmac_i32_16x16x32_iu8_w64 : AMDGPUBuiltin<" _ExtVector<4, int>(_Constant bool, int, _Constant bool, _ExtVector<2, int>, _ExtVector<4, int>, int, _Constant bool)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
848848def __builtin_amdgcn_swmmac_i32_16x16x32_iu4_w64 : AMDGPUBuiltin<" _ExtVector<4, int>(_Constant bool, int, _Constant bool, int, _ExtVector<4, int>, int, _Constant bool)" , [Const], " wmma-128b-insts,wavefrontsize64" >;
@@ -947,13 +947,13 @@ def __builtin_amdgcn_global_load_tr4_b64_v2i32 : AMDGPUBuiltin<"_ExtVector<2, in
947947def __builtin_amdgcn_global_load_tr8_b64_v2i32 : AMDGPUBuiltin<" _ExtVector<2, int>(_ExtVector<2, int> address_space<1> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
948948def __builtin_amdgcn_global_load_tr6_b96_v3i32 : AMDGPUBuiltin<" _ExtVector<3, int>(_ExtVector<3, int> address_space<1> *)" , [Const], " transpose-load-f4f6-insts,wavefrontsize32" >;
949949def __builtin_amdgcn_global_load_tr16_b128_v8i16 : AMDGPUBuiltin<" _ExtVector<8, short>(_ExtVector<8, short> address_space<1> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
// Changed pair: global_load_tr16_b128_v8f16 switches its 8-element vector
// element type from _Float16 to __fp16 in both the return type and the
// address_space<1> pointer parameter; attribute and feature string are kept.
950- def __builtin_amdgcn_global_load_tr16_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, _Float16 >(_ExtVector<8, _Float16 > address_space<1> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
950+ def __builtin_amdgcn_global_load_tr16_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, __fp16 >(_ExtVector<8, __fp16 > address_space<1> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
951951def __builtin_amdgcn_global_load_tr16_b128_v8bf16 : AMDGPUBuiltin<" _ExtVector<8, __bf16>(_ExtVector<8, __bf16> address_space<1> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
952952def __builtin_amdgcn_ds_load_tr4_b64_v2i32 : AMDGPUBuiltin<" _ExtVector<2, int>(_ExtVector<2, int> address_space<3> *)" , [Const], " transpose-load-f4f6-insts,wavefrontsize32" >;
953953def __builtin_amdgcn_ds_load_tr8_b64_v2i32 : AMDGPUBuiltin<" _ExtVector<2, int>(_ExtVector<2, int> address_space<3> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
954954def __builtin_amdgcn_ds_load_tr6_b96_v3i32 : AMDGPUBuiltin<" _ExtVector<3, int>(_ExtVector<3, int> address_space<3> *)" , [Const], " transpose-load-f4f6-insts,wavefrontsize32" >;
955955def __builtin_amdgcn_ds_load_tr16_b128_v8i16 : AMDGPUBuiltin<" _ExtVector<8, short>(_ExtVector<8, short> address_space<3> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
// Changed pair: ds_load_tr16_b128_v8f16 gets the same _Float16 -> __fp16
// element type substitution, here with an address_space<3> pointer parameter.
956- def __builtin_amdgcn_ds_load_tr16_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, _Float16 >(_ExtVector<8, _Float16 > address_space<3> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
956+ def __builtin_amdgcn_ds_load_tr16_b128_v8f16 : AMDGPUBuiltin<" _ExtVector<8, __fp16 >(_ExtVector<8, __fp16 > address_space<3> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
957957def __builtin_amdgcn_ds_load_tr16_b128_v8bf16 : AMDGPUBuiltin<" _ExtVector<8, __bf16>(_ExtVector<8, __bf16> address_space<3> *)" , [Const], " gfx1250-insts,wavefrontsize32" >;
958958
959959def __builtin_amdgcn_s_setprio_inc_wg : AMDGPUBuiltin<" void(_Constant short)" , [], " setprio-inc-wg-inst" >;
@@ -964,7 +964,7 @@ def __builtin_amdgcn_s_wait_asynccnt : AMDGPUBuiltin<"void(_Constant unsigned sh
964964def __builtin_amdgcn_s_wait_tensorcnt : AMDGPUBuiltin<" void(_Constant unsigned short)" , [], " gfx1250-insts" >;
965965
966966def __builtin_amdgcn_tanhf : AMDGPUBuiltin<" float(float)" , [Const], " tanh-insts" >;
// Changed pair: tanhh's return type and single parameter type switch from
// _Float16 to __fp16; the [Const] attribute and "tanh-insts" feature string
// are unchanged. The float and __bf16 siblings around it are context only.
967- def __builtin_amdgcn_tanhh : AMDGPUBuiltin<" _Float16(_Float16 )" , [Const], " tanh-insts" >;
967+ def __builtin_amdgcn_tanhh : AMDGPUBuiltin<" __fp16(__fp16 )" , [Const], " tanh-insts" >;
968968def __builtin_amdgcn_tanh_bf16 : AMDGPUBuiltin<" __bf16(__bf16)" , [Const], " bf16-trans-insts" >;
969969def __builtin_amdgcn_rcp_bf16 : AMDGPUBuiltin<" __bf16(__bf16)" , [Const], " bf16-trans-insts" >;
970970def __builtin_amdgcn_sqrt_bf16 : AMDGPUBuiltin<" __bf16(__bf16)" , [Const], " bf16-trans-insts" >;
0 commit comments