@@ -938,22 +938,36 @@ impl<'a, 'gcc, 'tcx> BuilderMethods<'a, 'tcx> for Builder<'a, 'gcc, 'tcx> {
938
938
fn load ( & mut self , pointee_ty : Type < ' gcc > , ptr : RValue < ' gcc > , align : Align ) -> RValue < ' gcc > {
939
939
let block = self . llbb ( ) ;
940
940
let function = block. get_function ( ) ;
941
+ // NOTE(FractalFir): In some cases, we *should* skip the call to get_aligned.
942
+ // For example, calling `get_aligned` on an `i8` is pointless (since it can only be 1-byte aligned).
943
+ // Calling get_aligned on a `u128`/`i128` causes the attribute to become "stacked"
944
+ //
945
+ // From GCC's perspective:
946
+ // __int128_t __attribute__((aligned(16))) __attribute__((aligned(16)))
947
+ // and:
948
+ // __int128_t __attribute__((aligned(16)))
949
+ // are 2 distinct, incompatible types.
950
+ //
951
+ // So, we skip the call to `get_aligned` in such a case. *Ideally*, we could do this for all the types,
952
+ // but the GCC APIs to facilitate this just aren't quite there yet.
953
+
954
+ // This checks that we only skip `get_aligned` on 128 bit ints if they have the correct alignment.
955
+ // Otherwise, this may be an under-aligned load, so we will still call get_aligned.
956
+ let mut can_skip_align = ( pointee_ty == self . cx . u128_type
957
+ || pointee_ty == self . cx . i128_type )
958
+ && align == self . int128_align ;
959
+ // We can skip the call to `get_aligned` for byte-sized types with alignment of 1.
960
+ can_skip_align = can_skip_align
961
+ || ( pointee_ty == self . cx . u8_type || pointee_ty == self . cx . i8_type )
962
+ && align. bytes ( ) == 1 ;
963
+ // Skip the call to `get_aligned` when possible.
964
+ let aligned_type =
965
+ if can_skip_align { pointee_ty } else { pointee_ty. get_aligned ( align. bytes ( ) ) } ;
966
+
967
+ let ptr = self . context . new_cast ( self . location , ptr, aligned_type. make_pointer ( ) ) ;
941
968
// NOTE: instead of returning the dereference here, we have to assign it to a variable in
942
969
// the current basic block. Otherwise, it could be used in another basic block, causing a
943
970
// dereference after a drop, for instance.
944
- // FIXME(antoyo): this check that we don't call get_aligned() a second time on a type.
945
- // Ideally, we shouldn't need to do this check.
946
- // FractalFir: the `align == self.int128_align` check ensures we *do* call `get_aligned` if
947
- // the alignment of a `u128`/`i128` is not the one mandated by the ABI. This ensures we handle
948
- // under-aligned loads correctly.
949
- let aligned_type = if ( pointee_ty == self . cx . u128_type || pointee_ty == self . cx . i128_type )
950
- && align == self . int128_align
951
- {
952
- pointee_ty
953
- } else {
954
- pointee_ty. get_aligned ( align. bytes ( ) )
955
- } ;
956
- let ptr = self . context . new_cast ( self . location , ptr, aligned_type. make_pointer ( ) ) ;
957
971
let deref = ptr. dereference ( self . location ) . to_rvalue ( ) ;
958
972
let loaded_value = function. new_local (
959
973
self . location ,
0 commit comments