@@ -309,7 +309,7 @@ impl<'ll, 'tcx> ArgAbiBuilderMethods<'tcx> for Builder<'_, 'll, 'tcx> {
309309}
310310
311311pub ( crate ) trait FnAbiLlvmExt < ' ll , ' tcx > {
312- fn llvm_type ( & self , cx : & CodegenCx < ' ll , ' tcx > ) -> & ' ll Type ;
312+ fn llvm_type ( & self , cx : & CodegenCx < ' ll , ' tcx > , name : & str ) -> & ' ll Type ;
313313 fn ptr_to_llvm_type ( & self , cx : & CodegenCx < ' ll , ' tcx > ) -> & ' ll Type ;
314314 fn llvm_cconv ( & self , cx : & CodegenCx < ' ll , ' tcx > ) -> llvm:: CallConv ;
315315
@@ -326,20 +326,17 @@ pub(crate) trait FnAbiLlvmExt<'ll, 'tcx> {
326326}
327327
328328impl < ' ll , ' tcx > FnAbiLlvmExt < ' ll , ' tcx > for FnAbi < ' tcx , Ty < ' tcx > > {
329- fn llvm_type ( & self , cx : & CodegenCx < ' ll , ' tcx > ) -> & ' ll Type {
329+ fn llvm_type ( & self , cx : & CodegenCx < ' ll , ' tcx > , name : & str ) -> & ' ll Type {
330+ debug ! ( "Getting LLVM type for {} with ABI {:?}" , name, self ) ;
330331 // Ignore "extra" args from the call site for C variadic functions.
331332 // Only the "fixed" args are part of the LLVM function signature.
332333 let args =
333334 if self . c_variadic { & self . args [ ..self . fixed_count as usize ] } else { & self . args } ;
334335
335336 let adjust_ty = |ty| {
336- // todo: rectify this to be more selective (help wanted)
337- let probably_unadjusted = self . conv == Conv :: C && !self . can_unwind && !self . c_variadic ;
338- let probably_amx_intrinsic = probably_unadjusted && cx. tcx . sess . target . arch == "x86_64" ;
337+ let amx_intrinsic = name. starts_with ( "llvm.x86." ) && name. ends_with ( ".internal" ) ;
339338 // Change type to `x86amx` from `i32x256` for x86_64 AMX intrinsics
340- if probably_amx_intrinsic
341- && cx. type_kind ( ty) == TypeKind :: Vector
342- && cx. vector_length ( ty) == 256
339+ if amx_intrinsic && cx. type_kind ( ty) == TypeKind :: Vector && cx. vector_length ( ty) == 256
343340 {
344341 let element_ty = cx. element_type ( ty) ;
345342 if cx. type_kind ( element_ty) == TypeKind :: Integer && cx. int_width ( element_ty) == 32 {
0 commit comments