|
| 1 | +// run-pass |
| 2 | +// only-x86_64 |
| 3 | +// compile-flags: -C opt-level=3 |
| 4 | + |
| 5 | +// Regression test for issue #79865. |
| 6 | +// The assertion will fail when compiled with Rust 1.56..=1.59 |
| 7 | +// due to a LLVM miscompilation. |
| 8 | + |
| 9 | +use std::arch::x86_64::*; |
| 10 | + |
| 11 | +fn main() { |
| 12 | + if is_x86_feature_detected!("avx") { |
| 13 | + let res: [f64; 4] = unsafe { std::mem::transmute::<_, _>(first()) }; |
| 14 | + assert_eq!(res, [22.0, 44.0, 66.0, 88.0]); |
| 15 | + } |
| 16 | +} |
| 17 | + |
| 18 | +#[target_feature(enable = "avx")] |
| 19 | +unsafe fn first() -> __m256d { |
| 20 | + second() |
| 21 | +} |
| 22 | + |
| 23 | +unsafe fn second() -> __m256d { |
| 24 | + let v0 = _mm256_setr_pd(1.0, 2.0, 3.0, 4.0); |
| 25 | + let v1 = _mm256_setr_pd(10.0, 20.0, 30.0, 40.0); |
| 26 | + |
| 27 | + // needs to be called twice to hit the miscompilation |
| 28 | + let (add, _) = add_sub(v0, v1); |
| 29 | + let (add, _) = add_sub(add, add); |
| 30 | + add |
| 31 | +} |
| 32 | + |
| 33 | +#[inline(never)] // needed to hit the miscompilation |
| 34 | +unsafe fn add_sub(v1: __m256d, v0: __m256d) -> (__m256d, __m256d) { |
| 35 | + let add = _mm256_add_pd(v0, v1); |
| 36 | + let sub = _mm256_sub_pd(v0, v1); |
| 37 | + (add, sub) |
| 38 | +} |
0 commit comments