Skip to content

Commit a44a20e

Browse files
committed
Windows x86: Change i128 to return via the vector ABI
Clang and GCC both return `i128` in xmm0 on windows-msvc and windows-gnu. Currently, Rust returns the type on the stack. Add a calling convention adjustment so we also return scalar `i128`s using the vector ABI, which makes our `i128` compatible with C. In the future, Clang may change to return `i128` on the stack for its `-msvc` targets (more at [1]). If this happens, the change here will need to be adjusted to only affect MinGW. Link: #134288 [1]
1 parent 581e0ac commit a44a20e

File tree

5 files changed

+44
-67
lines changed

5 files changed

+44
-67
lines changed

compiler/rustc_codegen_cranelift/src/abi/mod.rs

+13-9
Original file line numberDiff line numberDiff line change
@@ -122,7 +122,7 @@ impl<'tcx> FunctionCx<'_, '_, 'tcx> {
122122
&mut self,
123123
name: &str,
124124
params: Vec<AbiParam>,
125-
returns: Vec<AbiParam>,
125+
mut returns: Vec<AbiParam>,
126126
args: &[Value],
127127
) -> Cow<'_, [Value]> {
128128
// Pass i128 arguments by-ref on Windows.
@@ -146,15 +146,19 @@ impl<'tcx> FunctionCx<'_, '_, 'tcx> {
146146
(params, args.into())
147147
};
148148

149-
// Return i128 using a return area pointer on Windows and s390x.
150-
let adjust_ret_param =
151-
if self.tcx.sess.target.is_like_windows || self.tcx.sess.target.arch == "s390x" {
152-
returns.len() == 1 && returns[0].value_type == types::I128
153-
} else {
154-
false
155-
};
149+
let ret_single_i128 = returns.len() == 1 && returns[0].value_type == types::I128;
150+
if ret_single_i128 && self.tcx.sess.target.is_like_windows {
151+
// Return i128 using the vector ABI on Windows
152+
returns[0].value_type = types::I64X2;
153+
154+
let ret = self.lib_call_unadjusted(name, params, returns, &args)[0];
156155

157-
if adjust_ret_param {
156+
// FIXME(bytecodealliance/wasmtime#6104) use bitcast instead of store to get from i64x2 to i128
157+
let ret_ptr = self.create_stack_slot(16, 16);
158+
ret_ptr.store(self, ret, MemFlags::trusted());
159+
Cow::Owned(vec![ret_ptr.load(self, types::I128, MemFlags::trusted())])
160+
} else if ret_single_i128 && self.tcx.sess.target.arch == "s390x" {
161+
// Return i128 using a return area pointer on s390x.
158162
let mut params = params;
159163
let mut args = args.to_vec();
160164

compiler/rustc_codegen_cranelift/src/cast.rs

+3-19
Original file line numberDiff line numberDiff line change
@@ -96,25 +96,9 @@ pub(crate) fn clif_int_or_float_cast(
9696
},
9797
);
9898

99-
if fx.tcx.sess.target.is_like_windows {
100-
let ret = fx.lib_call(
101-
&name,
102-
vec![AbiParam::new(from_ty)],
103-
vec![AbiParam::new(types::I64X2)],
104-
&[from],
105-
)[0];
106-
// FIXME(bytecodealliance/wasmtime#6104) use bitcast instead of store to get from i64x2 to i128
107-
let ret_ptr = fx.create_stack_slot(16, 16);
108-
ret_ptr.store(fx, ret, MemFlags::trusted());
109-
ret_ptr.load(fx, types::I128, MemFlags::trusted())
110-
} else {
111-
fx.lib_call(
112-
&name,
113-
vec![AbiParam::new(from_ty)],
114-
vec![AbiParam::new(types::I128)],
115-
&[from],
116-
)[0]
117-
}
99+
fx.lib_call(&name, vec![AbiParam::new(from_ty)], vec![AbiParam::new(types::I128)], &[
100+
from,
101+
])[0]
118102
} else if to_ty == types::I8 || to_ty == types::I16 {
119103
// FIXME implement fcvt_to_*int_sat.i8/i16
120104
let val = if to_signed {

compiler/rustc_codegen_cranelift/src/codegen_i128.rs

+8-22
Original file line numberDiff line numberDiff line change
@@ -33,28 +33,14 @@ pub(crate) fn maybe_codegen<'tcx>(
3333
(BinOp::Rem, true) => "__modti3",
3434
_ => unreachable!(),
3535
};
36-
if fx.tcx.sess.target.is_like_windows {
37-
let args = [lhs.load_scalar(fx), rhs.load_scalar(fx)];
38-
let ret = fx.lib_call(
39-
name,
40-
vec![AbiParam::new(types::I128), AbiParam::new(types::I128)],
41-
vec![AbiParam::new(types::I64X2)],
42-
&args,
43-
)[0];
44-
// FIXME(bytecodealliance/wasmtime#6104) use bitcast instead of store to get from i64x2 to i128
45-
let ret_place = CPlace::new_stack_slot(fx, lhs.layout());
46-
ret_place.to_ptr().store(fx, ret, MemFlags::trusted());
47-
Some(ret_place.to_cvalue(fx))
48-
} else {
49-
let args = [lhs.load_scalar(fx), rhs.load_scalar(fx)];
50-
let ret_val = fx.lib_call(
51-
name,
52-
vec![AbiParam::new(types::I128), AbiParam::new(types::I128)],
53-
vec![AbiParam::new(types::I128)],
54-
&args,
55-
)[0];
56-
Some(CValue::by_val(ret_val, lhs.layout()))
57-
}
36+
let args = [lhs.load_scalar(fx), rhs.load_scalar(fx)];
37+
let ret_val = fx.lib_call(
38+
name,
39+
vec![AbiParam::new(types::I128), AbiParam::new(types::I128)],
40+
vec![AbiParam::new(types::I128)],
41+
&args,
42+
)[0];
43+
Some(CValue::by_val(ret_val, lhs.layout()))
5844
}
5945
BinOp::Lt | BinOp::Le | BinOp::Eq | BinOp::Ge | BinOp::Gt | BinOp::Ne | BinOp::Cmp => None,
6046
BinOp::Shl | BinOp::ShlUnchecked | BinOp::Shr | BinOp::ShrUnchecked => None,

compiler/rustc_target/src/callconv/x86_win64.rs

+13-7
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
1-
use rustc_abi::{BackendRepr, Float, Primitive};
1+
use rustc_abi::{BackendRepr, Float, Integer, Primitive, RegKind, Size};
22

33
use crate::abi::call::{ArgAbi, FnAbi, Reg};
44
use crate::spec::HasTargetSpec;
55

66
// Win64 ABI: https://docs.microsoft.com/en-us/cpp/build/parameter-passing
77

88
pub(crate) fn compute_abi_info<Ty>(_cx: &impl HasTargetSpec, fn_abi: &mut FnAbi<'_, Ty>) {
9-
let fixup = |a: &mut ArgAbi<'_, Ty>| {
9+
let fixup = |a: &mut ArgAbi<'_, Ty>, is_ret: bool| {
1010
match a.layout.backend_repr {
1111
BackendRepr::Uninhabited | BackendRepr::Memory { sized: false } => {}
1212
BackendRepr::ScalarPair(..) | BackendRepr::Memory { sized: true } => {
@@ -23,11 +23,16 @@ pub(crate) fn compute_abi_info<Ty>(_cx: &impl HasTargetSpec, fn_abi: &mut FnAbi<
2323
// (probably what clang calls "illegal vectors").
2424
}
2525
BackendRepr::Scalar(scalar) => {
26-
// Match what LLVM does for `f128` so that `compiler-builtins` builtins match up
27-
// with what LLVM expects.
28-
if a.layout.size.bytes() > 8
26+
if is_ret && matches!(scalar.primitive(), Primitive::Int(Integer::I128, _)) {
27+
// `i128` is returned in xmm0 by Clang and GCC
28+
// FIXME(#134288): This may change for the `-msvc` targets in the future.
29+
let reg = Reg { kind: RegKind::Vector, size: Size::from_bits(128) };
30+
a.cast_to(reg);
31+
} else if a.layout.size.bytes() > 8
2932
&& !matches!(scalar.primitive(), Primitive::Float(Float::F128))
3033
{
34+
// Match what LLVM does for `f128` so that `compiler-builtins` builtins match up
35+
// with what LLVM expects.
3136
a.make_indirect();
3237
} else {
3338
a.extend_integer_width_to(32);
@@ -37,8 +42,9 @@ pub(crate) fn compute_abi_info<Ty>(_cx: &impl HasTargetSpec, fn_abi: &mut FnAbi<
3742
};
3843

3944
if !fn_abi.ret.is_ignore() {
40-
fixup(&mut fn_abi.ret);
45+
fixup(&mut fn_abi.ret, true);
4146
}
47+
4248
for arg in fn_abi.args.iter_mut() {
4349
if arg.is_ignore() && arg.layout.is_zst() {
4450
// Windows ABIs do not talk about ZST since such types do not exist in MSVC.
@@ -49,7 +55,7 @@ pub(crate) fn compute_abi_info<Ty>(_cx: &impl HasTargetSpec, fn_abi: &mut FnAbi<
4955
arg.make_indirect_from_ignore();
5056
continue;
5157
}
52-
fixup(arg);
58+
fixup(arg, false);
5359
}
5460
// FIXME: We should likely also do something about ZST return types, similar to above.
5561
// However, that's non-trivial due to `()`.

tests/codegen/i128-x86-callconv.rs

+7-10
Original file line numberDiff line numberDiff line change
@@ -41,12 +41,11 @@ pub extern "C" fn pass(_arg0: u32, arg1: i128) {
4141
#[no_mangle]
4242
pub extern "C" fn ret(_arg0: u32, arg1: i128) -> i128 {
4343
// CHECK-LABEL: @ret(
44-
// i128 is returned on the stack on Windows.
45-
// FIXME: this ABI does not agree with Clang or MinGW GCC
46-
// WIN-SAME: ptr{{.*}} sret([16 x i8]){{.*}} [[RET:%_[0-9]+]], i32{{.*}} %_arg0, ptr{{.*}} %arg1)
47-
// WIN: [[LOADED:%[0-9]+]] = load i128, ptr %arg1
48-
// WIN: store i128 [[LOADED]], ptr [[RET]]
49-
// WIN: ret void
44+
// i128 is returned in xmm0 on Windows
45+
// FIXME(#134288): This may change for the `-msvc` targets in the future.
46+
// WIN-SAME: i32{{.*}} %_arg0, ptr{{.*}} %arg1)
47+
// WIN: [[LOADED:%[_0-9]+]] = load <16 x i8>, ptr %arg1
48+
// WIN-NEXT: ret <16 x i8> [[LOADED]]
5049
arg1
5150
}
5251

@@ -55,10 +54,8 @@ pub extern "C" fn ret(_arg0: u32, arg1: i128) -> i128 {
5554
pub extern "C" fn forward(dst: *mut i128) {
5655
// CHECK-LABEL: @forward
5756
// WIN-SAME: ptr{{.*}} %dst)
58-
// WIN: [[RETURNED:%[_0-9]+]] = alloca [16 x i8], align 16
59-
// WIN: call void @extern_ret({{.*}} [[RETURNED]])
60-
// WIN: [[TMP:%[_0-9]+]] = load i128, ptr [[RETURNED]]
61-
// WIN: store i128 [[TMP]], ptr %dst
57+
// WIN: [[RETURNED:%[_0-9]+]] = tail call <16 x i8> @extern_ret()
58+
// WIN: store <16 x i8> [[RETURNED]], ptr %dst
6259
// WIN: ret void
6360
unsafe { *dst = extern_ret() };
6461
}

0 commit comments

Comments
 (0)