Skip to content

Commit ee4cc72

Browse files
authored
Rollup merge of rust-lang#116099 - eduardosm:issue-79865-regression, r=oli-obk
Add regression test for issue rust-lang#79865 Closes rust-lang#79865
2 parents 27b4eb9 + b683684 commit ee4cc72

File tree

1 file changed

+38
-0
lines changed

1 file changed

+38
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
// run-pass
2+
// only-x86_64
3+
// compile-flags: -C opt-level=3
4+
5+
// Regression test for issue #79865.
6+
// The assertion will fail when compiled with Rust 1.56..=1.59
7+
// due to a LLVM miscompilation.
8+
9+
use std::arch::x86_64::*;
10+
11+
fn main() {
12+
if is_x86_feature_detected!("avx") {
13+
let res: [f64; 4] = unsafe { std::mem::transmute::<_, _>(first()) };
14+
assert_eq!(res, [22.0, 44.0, 66.0, 88.0]);
15+
}
16+
}
17+
18+
#[target_feature(enable = "avx")]
19+
unsafe fn first() -> __m256d {
20+
second()
21+
}
22+
23+
unsafe fn second() -> __m256d {
24+
let v0 = _mm256_setr_pd(1.0, 2.0, 3.0, 4.0);
25+
let v1 = _mm256_setr_pd(10.0, 20.0, 30.0, 40.0);
26+
27+
// needs to be called twice to hit the miscompilation
28+
let (add, _) = add_sub(v0, v1);
29+
let (add, _) = add_sub(add, add);
30+
add
31+
}
32+
33+
#[inline(never)] // needed to hit the miscompilation
34+
unsafe fn add_sub(v1: __m256d, v0: __m256d) -> (__m256d, __m256d) {
35+
let add = _mm256_add_pd(v0, v1);
36+
let sub = _mm256_sub_pd(v0, v1);
37+
(add, sub)
38+
}

0 commit comments

Comments
 (0)