@@ -938,22 +938,36 @@ impl<'a, 'gcc, 'tcx> BuilderMethods<'a, 'tcx> for Builder<'a, 'gcc, 'tcx> {
938938 fn load ( & mut self , pointee_ty : Type < ' gcc > , ptr : RValue < ' gcc > , align : Align ) -> RValue < ' gcc > {
939939 let block = self . llbb ( ) ;
940940 let function = block. get_function ( ) ;
941+ // NOTE(FractalFir): In some cases, we *should* skip the call to get_aligned.
942+ // For example, calling `get_aligned` on an `i8` is pointless (since it can only be 1-aligned).
943+ // Calling `get_aligned` on a `u128`/`i128` causes the attribute to become "stacked".
944+ //
945+ // From GCC's perspective:
946+ // __int128_t __attribute__((aligned(16))) __attribute__((aligned(16)))
947+ // and:
948+ // __int128_t __attribute__((aligned(16)))
949+ // are 2 distinct, incompatible types.
950+ //
951+ // So, we skip the call to `get_aligned` in such a case. *Ideally*, we could do this for all the types,
952+ // but the GCC APIs to facilitate this just aren't quite there yet.
953+
954+ // This checks that we only skip `get_aligned` on 128 bit ints if they have the correct alignment.
955+ // Otherwise, this may be an under-aligned load, so we will still call get_aligned.
956+ let mut can_skip_align = ( pointee_ty == self . cx . u128_type
957+ || pointee_ty == self . cx . i128_type )
958+ && align == self . int128_align ;
959+ // We can skip the call to `get_aligned` for byte-sized types with alignment of 1.
960+ can_skip_align = can_skip_align
961+ || ( pointee_ty == self . cx . u8_type || pointee_ty == self . cx . i8_type )
962+ && align. bytes ( ) == 1 ;
963+ // Skip the call to `get_aligned` when possible.
964+ let aligned_type =
965+ if can_skip_align { pointee_ty } else { pointee_ty. get_aligned ( align. bytes ( ) ) } ;
966+
967+ let ptr = self . context . new_cast ( self . location , ptr, aligned_type. make_pointer ( ) ) ;
941968 // NOTE: instead of returning the dereference here, we have to assign it to a variable in
942969 // the current basic block. Otherwise, it could be used in another basic block, causing a
943970 // dereference after a drop, for instance.
944- // FIXME(antoyo): this check that we don't call get_aligned() a second time on a type.
945- // Ideally, we shouldn't need to do this check.
946- // FractalFir: the `align == self.int128_align` check ensures we *do* call `get_aligned` if
947- // the alignment of a `u128`/`i128` is not the one mandated by the ABI. This ensures we handle
948- // under-aligned loads correctly.
949- let aligned_type = if ( pointee_ty == self . cx . u128_type || pointee_ty == self . cx . i128_type )
950- && align == self . int128_align
951- {
952- pointee_ty
953- } else {
954- pointee_ty. get_aligned ( align. bytes ( ) )
955- } ;
956- let ptr = self . context . new_cast ( self . location , ptr, aligned_type. make_pointer ( ) ) ;
957971 let deref = ptr. dereference ( self . location ) . to_rvalue ( ) ;
958972 let loaded_value = function. new_local (
959973 self . location ,
0 commit comments