rust-lang · Jamesbarford · Apr 17, 2026 · Apr 17, 2026 · Apr 17, 2026 · Apr 21, 2026
diff --git a/compiler/rustc_codegen_llvm/src/attributes.rs b/compiler/rustc_codegen_llvm/src/attributes.rs
@@ -39,25 +39,23 @@ pub(crate) fn remove_string_attr_from_llfn(llfn: &Value, name: &str) {
     llvm::RemoveStringAttrFromFn(llfn, name);
 }
 
-/// Get LLVM attribute for the provided inline heuristic.
-pub(crate) fn inline_attr<'ll, 'tcx>(
+/// Get LLVM attribute for the provided inline heuristic that can be applied
+/// to a function definition.
+fn inline_attr_for_fn_def<'ll, 'tcx>(
     cx: &SimpleCx<'ll>,
     tcx: TyCtxt<'tcx>,
     instance: ty::Instance<'tcx>,
+    has_function_features: bool,
 ) -> Option<&'ll Attribute> {
-    // `optnone` requires `noinline`
-    let codegen_fn_attrs = tcx.codegen_fn_attrs(instance.def_id());
-    let inline = match (codegen_fn_attrs.inline, &codegen_fn_attrs.optimize) {
-        (_, OptimizeAttr::DoNotOptimize) => InlineAttr::Never,
-        (InlineAttr::None, _) if instance.def.requires_inline(tcx) => InlineAttr::Hint,
-        (inline, _) => inline,
-    };
-
     if !tcx.sess.opts.unstable_opts.inline_llvm {
         // disable LLVM inlining
         return Some(AttributeKind::NoInline.create_attr(cx.llcx));
     }
-    match inline {
+
+    let codegen_fn_attrs = tcx.codegen_fn_attrs(instance.def_id());
+    let inline = get_inline_attr_from_codegen_fn_attrs(tcx, codegen_fn_attrs, instance);
+
+    let llvm_attr = match inline {
         InlineAttr::Hint => Some(AttributeKind::InlineHint.create_attr(cx.llcx)),
         InlineAttr::Always | InlineAttr::Force { .. } => {
             Some(AttributeKind::AlwaysInline.create_attr(cx.llcx))
@@ -70,7 +68,58 @@ pub(crate) fn inline_attr<'ll, 'tcx>(
             }
         }
         InlineAttr::None => None,
+    };
+
+    let is_inline_always = is_inline_always_attr(inline);
+    // Keep non-`#[inline(always)]` attributes on the function definition as
+    // usual. `#[inline(always)]` can also stay on the function when there are
+    // no per-function target features.
+    //
+    // Once a function has target features, we avoid attaching `alwaysinline`
+    // to the definition itself. In that case the attribute is checked and,
+    // when legal, emitted on individual call sites instead.
+    if is_inline_always && has_function_features { None } else { llvm_attr }
+}
+
+/// Resolve the effective `InlineAttr` for `instance`; `optnone` forces `noinline`.
+fn get_inline_attr_from_codegen_fn_attrs<'tcx>(
+    tcx: TyCtxt<'tcx>,
+    codegen_fn_attrs: &CodegenFnAttrs,
+    instance: ty::Instance<'tcx>,
+) -> InlineAttr {
+    match codegen_fn_attrs.inline {
+        _ if matches!(codegen_fn_attrs.optimize, OptimizeAttr::DoNotOptimize) => InlineAttr::Never,
+        InlineAttr::None if instance.def.requires_inline(tcx) => InlineAttr::Hint,
+        requested => requested,
+    }
+}
+
+/// Whether `inline_attr` is `InlineAttr::Always` or `InlineAttr::Force`.
+#[inline]
+fn is_inline_always_attr(inline_attr: InlineAttr) -> bool {
+    matches!(inline_attr, InlineAttr::Always | InlineAttr::Force { .. })
+}
+
+/// Whether `#[inline(always)]` has to be handled at the callsite instead of the definition.
+pub(crate) fn has_inline_always_callsite_attribute<'tcx>(
+    tcx: TyCtxt<'tcx>,
+    attrs: &CodegenFnAttrs,
+    instance: ty::Instance<'tcx>,
+) -> bool {
+    // LLVM inlining is disabled, so never ask for a callsite attribute.
+    if !tcx.sess.opts.unstable_opts.inline_llvm {
+        return false;
     }
+
+    // If there are no target features on the function then there is nothing
+    // to do at the callsite, as the attribute will already have been applied
+    // to the function definition.
+    if attrs.target_features.is_empty() {
+        return false;
+    }
+
+    // Only `#[inline(always)]` (and forced inlining) is relevant here.
+    is_inline_always_attr(get_inline_attr_from_codegen_fn_attrs(tcx, attrs, instance))
 }
 
 #[inline]
@@ -534,14 +583,11 @@ pub(crate) fn llfn_attrs_from_instance<'ll, 'tcx>(
     let function_features =
         codegen_fn_attrs.target_features.iter().map(|f| f.name.as_str()).collect::<Vec<&str>>();
 
-    // Apply function attributes as per usual if there are no user defined
-    // target features otherwise this will get applied at the callsite.
-    if function_features.is_empty() {
-        if let Some(instance) = instance
-            && let Some(inline_attr) = inline_attr(cx, tcx, instance)
-        {
-            to_add.push(inline_attr);
-        }
+    if let Some(instance) = instance
+        && let Some(inline_attr) =
+            inline_attr_for_fn_def(cx, tcx, instance, !function_features.is_empty())
+    {
+        to_add.push(inline_attr);
     }
 
     let function_features = function_features

diff --git a/compiler/rustc_codegen_llvm/src/builder.rs b/compiler/rustc_codegen_llvm/src/builder.rs
@@ -16,7 +16,7 @@ use rustc_codegen_ssa::mir::place::PlaceRef;
 use rustc_codegen_ssa::traits::*;
 use rustc_data_structures::small_c_str::SmallCStr;
 use rustc_hir::def_id::DefId;
-use rustc_middle::middle::codegen_fn_attrs::{CodegenFnAttrs, TargetFeature, TargetFeatureKind};
+use rustc_middle::middle::codegen_fn_attrs::CodegenFnAttrs;
 use rustc_middle::ty::layout::{
     FnAbiError, FnAbiOfHelpers, FnAbiRequest, HasTypingEnv, LayoutError, LayoutOfHelpers,
     TyAndLayout,
@@ -31,12 +31,12 @@ use smallvec::SmallVec;
 use tracing::{debug, instrument};
 
 use crate::abi::FnAbiLlvmExt;
-use crate::attributes;
+use crate::attributes::{self};
 use crate::common::Funclet;
 use crate::context::{CodegenCx, FullCx, GenericCx, SCx};
 use crate::llvm::{
-    self, AtomicOrdering, AtomicRmwBinOp, BasicBlock, FromGeneric, GEPNoWrapFlags, Metadata, TRUE,
-    ToLlvmBool, Type, Value,
+    self, AtomicOrdering, AtomicRmwBinOp, AttributeKind, BasicBlock, FromGeneric, GEPNoWrapFlags,
+    Metadata, TRUE, ToLlvmBool, Type, Value,
 };
 use crate::type_of::LayoutLlvmExt;
 
@@ -1427,29 +1427,38 @@ impl<'a, 'll, 'tcx> BuilderMethods<'a, 'tcx> for Builder<'a, 'll, 'tcx> {
             )
         };
 
-        if let Some(callee_instance) = callee_instance {
+        // Check for whether we can add `#[inline(always)]` to a callsite
+        if let (Some(callee_instance), Some(caller_attrs)) = (callee_instance, caller_attrs) {
             // Attributes on the function definition being called
             let callee_attrs = self.cx.tcx.codegen_fn_attrs(callee_instance.def_id());
-            if let Some(caller_attrs) = caller_attrs
-                // If there is an inline attribute and a target feature that matches
-                // we will add the attribute to the callsite otherwise we'll omit
-                // this and not add the attribute to prevent soundness issues.
-                && let Some(inlining_rule) = attributes::inline_attr(&self.cx, self.cx.tcx, callee_instance)
-                && self.cx.tcx.is_target_feature_call_safe(
+
+            // Only propagate `#[inline(always)]` to the callsite when there is
+            // an attribute and the caller and callee are compatible for
+            // inlining here. Otherwise we explicitly emit a `noinline` to
+            // ensure that the function will not get inlined through an LLVM
+            // pass.
+            if attributes::has_inline_always_callsite_attribute(
+                self.cx.tcx,
+                callee_attrs,
+                callee_instance,
+            ) {
+                if self.tcx.is_call_inline_able_at_callsite(
                     &callee_attrs.target_features,
-                    &caller_attrs.target_features.iter().cloned().chain(
-                        self.cx.tcx.sess.target_features.iter().map(|feat| TargetFeature {
-                            name: *feat,
-                            kind: TargetFeatureKind::Implied,
-                        })
-                    ).collect::<Vec<_>>(),
-                )
-            {
-                attributes::apply_to_callsite(
-                    call,
-                    llvm::AttributePlace::Function,
-                    &[inlining_rule],
-                );
+                    &caller_attrs.target_features,
+                ) {
+                    attributes::apply_to_callsite(
+                        call,
+                        llvm::AttributePlace::Function,
+                        &[AttributeKind::AlwaysInline.create_attr(self.cx.llcx)],
+                    );
+                } else {
+                    // Ensure the function call will not be inlined.
+                    attributes::apply_to_callsite(
+                        call,
+                        llvm::AttributePlace::Function,
+                        &[AttributeKind::NoInline.create_attr(self.cx.llcx)],
+                    );
+                }
             }
         }
 

diff --git a/compiler/rustc_middle/src/ty/context.rs b/compiler/rustc_middle/src/ty/context.rs
@@ -19,7 +19,7 @@ use rustc_abi::{ExternAbi, FieldIdx, Layout, LayoutData, TargetDataLayout, Varia
 use rustc_ast as ast;
 use rustc_data_structures::defer;
 use rustc_data_structures::fingerprint::Fingerprint;
-use rustc_data_structures::fx::FxHashMap;
+use rustc_data_structures::fx::{FxHashMap, FxIndexSet};
 use rustc_data_structures::intern::Interned;
 use rustc_data_structures::jobserver::Proxy;
 use rustc_data_structures::profiling::SelfProfilerRef;
@@ -1321,6 +1321,58 @@ impl<'tcx> TyCtxt<'tcx> {
                 .all(|feature| body_features.iter().any(|f| f.name == feature.name))
     }
 
+    /// Decides whether a call may be marked always-inline at this callsite,
+    /// given the target features of the callee and of the caller.
+    ///
+    /// "The caller has at least the callee's target features" is necessary but
+    /// not enough: both sides must also agree on every target feature that
+    /// affects the vector ABI, otherwise inlining could reinterpret arguments
+    /// under a different calling convention.
+    pub fn is_call_inline_able_at_callsite(
+        self,
+        callee_features: &[TargetFeature],
+        caller_features: &[TargetFeature],
+    ) -> bool {
+        // Globally enabled target features belong to the effective feature set
+        // of both sides, so fold them in before comparing.
+        let callee = self.effective_inline_target_features(callee_features);
+        let caller = self.effective_inline_target_features(caller_features);
+
+        // Why a subset check alone is insufficient: `avx` implicitly enables
+        // `sse`, so a callee that only requires `sse` looks like a subset of an
+        // `avx` caller. But `avx` also changes how vector arguments are passed,
+        // so inlining that callee into the caller would cross an ABI boundary.
+        // Hence the ABI-relevant vector features are compared for equality
+        // first, and only then is the subset relation checked.
+        let same_vector_abi = self.vector_abi_matches(&callee, &caller);
+        same_vector_abi && callee.is_subset(&caller)
+    }
+
+    /// Whether both feature sets enable the same vector-length-relevant features.
+    fn vector_abi_matches(self, callee: &FxIndexSet<Symbol>, caller: &FxIndexSet<Symbol>) -> bool {
+        self.abi_target_features(caller) == self.abi_target_features(callee)
+    }
+
+    /// Returns the subset of `feature_names` for which the session target
+    /// reports that the feature could influence the vector length.
+    pub fn abi_target_features(self, feature_names: &FxIndexSet<Symbol>) -> FxIndexSet<Symbol> {
+        feature_names
+            .iter()
+            .filter(|it| self.sess.target.feature_could_influence_vector_length(it.as_str()))
+            .copied()
+            .collect()
+    }
+
+    /// Returns the session's `unstable_target_features` extended with the names
+    /// of the given per-function `features`.
+    pub fn effective_inline_target_features(
+        self,
+        features: &[TargetFeature],
+    ) -> FxIndexSet<Symbol> {
+        let global = self.sess.unstable_target_features.iter().copied();
+        global.chain(features.iter().map(|feature| feature.name)).collect()
+    }
+
     /// Returns the safe version of the signature of the given function, if calling it
     /// would be safe in the context of the given caller.
     pub fn adjust_target_feature_sig(

diff --git a/compiler/rustc_mir_transform/src/check_inline_always_target_features.rs b/compiler/rustc_mir_transform/src/check_inline_always_target_features.rs
@@ -1,5 +1,5 @@
 use rustc_hir::attrs::InlineAttr;
-use rustc_middle::middle::codegen_fn_attrs::{TargetFeature, TargetFeatureKind};
+use rustc_middle::middle::codegen_fn_attrs::TargetFeatureKind;
 use rustc_middle::mir::{Body, TerminatorKind};
 use rustc_middle::ty::{self, TyCtxt};
 
@@ -51,36 +51,83 @@ fn check_inline_always_target_features<'tcx>(tcx: TyCtxt<'tcx>, body: &Body<'tcx
 
                 // Scan the users defined target features and ensure they
                 // match the caller.
-                if tcx.is_target_feature_call_safe(
+                if tcx.is_call_inline_able_at_callsite(
                     &callee_codegen_fn_attrs.target_features,
-                    &caller_codegen_fn_attrs
-                        .target_features
-                        .iter()
-                        .cloned()
-                        .chain(tcx.sess.target_features.iter().map(|feat| TargetFeature {
-                            name: *feat,
-                            kind: TargetFeatureKind::Implied,
-                        }))
-                        .collect::<Vec<_>>(),
+                    &caller_codegen_fn_attrs.target_features,
                 ) {
                     continue;
                 }
 
-                let callee_only: Vec<_> = callee_codegen_fn_attrs
+                // Use the full target feature sets, including implied and
+                // command-line features, to classify the mismatch. Diagnostic
+                // messages should still only mention the non-implied features
+                // that the user actually enabled.
+                let caller_features =
+                    tcx.effective_inline_target_features(&caller_codegen_fn_attrs.target_features);
+                let callee_features =
+                    tcx.effective_inline_target_features(&callee_codegen_fn_attrs.target_features);
+
+                let explicit_caller_features: Vec<_> = caller_codegen_fn_attrs
+                    .target_features
+                    .iter()
+                    .cloned()
+                    .filter(|it| it.kind != TargetFeatureKind::Implied)
+                    .collect();
+                let explicit_callee_features: Vec<_> = callee_codegen_fn_attrs
                     .target_features
                     .iter()
-                    .filter(|it| !caller_codegen_fn_attrs.target_features.contains(it))
-                    .filter(|it| !matches!(it.kind, TargetFeatureKind::Implied))
-                    .map(|it| it.name.as_str())
+                    .cloned()
+                    .filter(|it| it.kind != TargetFeatureKind::Implied)
                     .collect();
 
-                crate::errors::emit_inline_always_target_feature_diagnostic(
-                    tcx,
-                    terminator.source_info.span,
-                    callee_def_id,
-                    caller_def_id.into(),
-                    &callee_only,
-                );
+                let explicit_caller_features =
+                    tcx.effective_inline_target_features(&explicit_caller_features);
+                let explicit_callee_features =
+                    tcx.effective_inline_target_features(&explicit_callee_features);
+
+                // If the callee's features are otherwise a subset of the
+                // caller's, then the mismatch is only due to the caller using a
+                // different vector ABI from the callee.
+                if callee_features.is_subset(&caller_features) {
+                    // We only want to display the target features the user
+                    // missed out. Not every feature that is possibly enabled.
+                    let caller_abi_features = tcx.abi_target_features(&explicit_caller_features);
+                    let callee_abi_features = tcx.abi_target_features(&explicit_callee_features);
+                    let caller_only = caller_abi_features
+                        .difference(&callee_abi_features)
+                        .map(|it| it.as_str())
+                        .collect::<Vec<_>>()
+                        .join(", ");
+
+                    // Emit that the issue is caused by a vector ABI mismatch.
+                    crate::errors::emit_inline_always_target_feature_diagnostic(
+                        tcx,
+                        terminator.source_info.span,
+                        callee_def_id,
+                        caller_def_id.into(),
+                        &caller_only,
+                        caller_def_id.into(),
+                        callee_def_id,
+                    );
+                } else {
+                    let callee_only = explicit_callee_features
+                        .difference(&explicit_caller_features)
+                        .map(|it| it.as_str())
+                        .collect::<Vec<_>>()
+                        .join(", ");
+
+                    // Emit that the issue stems from the callee having features
+                    // enabled that the caller does not have enabled.
+                    crate::errors::emit_inline_always_target_feature_diagnostic(
+                        tcx,
+                        terminator.source_info.span,
+                        callee_def_id,
+                        caller_def_id.into(),
+                        &callee_only,
+                        callee_def_id,
+                        caller_def_id.into(),
+                    );
+                }
             }
             _ => (),
         }