Skip to content

Commit cf6f6ee

Browse files
authored
Rollup merge of rust-lang#147404 - JamieCunliffe:inline-always, r=jackh726
Fix issue with callsite inline attribute not being applied sometimes. If the calling function had more target features enabled than the callee, then the attribute wasn't being applied, as the arguments for the check had been swapped round. Also includes target features that are part of the global set, as the warning was checking those, but when adding the attribute they were not checked. Add a codegen-llvm test to check that the attribute is actually applied, as previously only the warning was being checked. Tracking issue: rust-lang#145574
2 parents ceb7df7 + e2c5c18 commit cf6f6ee

File tree

3 files changed

+50
-3
lines changed

3 files changed

+50
-3
lines changed

compiler/rustc_codegen_llvm/src/builder.rs

Lines changed: 7 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@ use rustc_codegen_ssa::mir::place::PlaceRef;
1616
use rustc_codegen_ssa::traits::*;
1717
use rustc_data_structures::small_c_str::SmallCStr;
1818
use rustc_hir::def_id::DefId;
19-
use rustc_middle::middle::codegen_fn_attrs::CodegenFnAttrs;
19+
use rustc_middle::middle::codegen_fn_attrs::{CodegenFnAttrs, TargetFeature, TargetFeatureKind};
2020
use rustc_middle::ty::layout::{
2121
FnAbiError, FnAbiOfHelpers, FnAbiRequest, HasTypingEnv, LayoutError, LayoutOfHelpers,
2222
TyAndLayout,
@@ -1417,14 +1417,18 @@ impl<'a, 'll, 'tcx> BuilderMethods<'a, 'tcx> for Builder<'a, 'll, 'tcx> {
14171417
// Attributes on the function definition being called
14181418
let fn_defn_attrs = self.cx.tcx.codegen_fn_attrs(instance.def_id());
14191419
if let Some(fn_call_attrs) = fn_call_attrs
1420-
&& !fn_call_attrs.target_features.is_empty()
14211420
// If there is an inline attribute and a target feature that matches
14221421
// we will add the attribute to the callsite otherwise we'll omit
14231422
// this and not add the attribute to prevent soundness issues.
14241423
&& let Some(inlining_rule) = attributes::inline_attr(&self.cx, self.cx.tcx, instance)
14251424
&& self.cx.tcx.is_target_feature_call_safe(
1426-
&fn_call_attrs.target_features,
14271425
&fn_defn_attrs.target_features,
1426+
&fn_call_attrs.target_features.iter().cloned().chain(
1427+
self.cx.tcx.sess.target_features.iter().map(|feat| TargetFeature {
1428+
name: *feat,
1429+
kind: TargetFeatureKind::Implied,
1430+
})
1431+
).collect::<Vec<_>>(),
14281432
)
14291433
{
14301434
attributes::apply_to_callsite(

compiler/rustc_middle/src/ty/context.rs

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2088,6 +2088,8 @@ impl<'tcx> TyCtxt<'tcx> {
20882088
self.sess.dcx()
20892089
}
20902090

2091+
/// Checks to see if the caller (`body_features`) has all the features required by the callee
2092+
/// (`callee_features`).
20912093
pub fn is_target_feature_call_safe(
20922094
self,
20932095
callee_features: &[TargetFeature],
Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
//@ add-minicore
2+
//@ compile-flags: --target aarch64-unknown-linux-gnu -Zinline-mir=no -C no-prepopulate-passes
3+
//@ needs-llvm-components: aarch64
4+
5+
#![crate_type = "lib"]
6+
#![feature(no_core, lang_items, target_feature_inline_always)]
7+
#![no_core]
8+
9+
extern crate minicore;
10+
use minicore::*;
11+
12+
#[inline(always)]
13+
#[target_feature(enable = "neon")]
14+
#[no_mangle]
15+
pub fn single_target_feature() -> i32 {
16+
42
17+
}
18+
19+
#[inline(always)]
20+
#[target_feature(enable = "neon,i8mm")]
21+
#[no_mangle]
22+
// CHECK: define noundef i32 @multiple_target_features() unnamed_addr #1 {
23+
pub fn multiple_target_features() -> i32 {
24+
// CHECK: %_0 = call noundef i32 @single_target_feature() #3
25+
single_target_feature()
26+
}
27+
28+
#[no_mangle]
29+
// CHECK: define noundef i32 @inherits_from_global() unnamed_addr #2 {
30+
pub fn inherits_from_global() -> i32 {
31+
unsafe {
32+
// CHECK: %_0 = call noundef i32 @single_target_feature() #3
33+
single_target_feature()
34+
}
35+
}
36+
37+
// Attribute #3 requires the alwaysinline attribute. The alwaysinline attribute is not emitted on a
38+
// function definition when target features are present; rather, it will be moved onto the function
39+
// call if the features match up.
40+
//
41+
// CHECK: attributes #3 = { alwaysinline nounwind }

0 commit comments

Comments
 (0)