summaryrefslogtreecommitdiffstats
path: root/tests/ui/codegen/issue-79865-llvm-miscompile.rs
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-05-30 18:31:44 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-05-30 18:31:44 +0000
commitc23a457e72abe608715ac76f076f47dc42af07a5 (patch)
tree2772049aaf84b5c9d0ed12ec8d86812f7a7904b6 /tests/ui/codegen/issue-79865-llvm-miscompile.rs
parentReleasing progress-linux version 1.73.0+dfsg1-1~progress7.99u1. (diff)
downloadrustc-c23a457e72abe608715ac76f076f47dc42af07a5.tar.xz
rustc-c23a457e72abe608715ac76f076f47dc42af07a5.zip
Merging upstream version 1.74.1+dfsg1.
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'tests/ui/codegen/issue-79865-llvm-miscompile.rs')
-rw-r--r--tests/ui/codegen/issue-79865-llvm-miscompile.rs38
1 files changed, 38 insertions, 0 deletions
diff --git a/tests/ui/codegen/issue-79865-llvm-miscompile.rs b/tests/ui/codegen/issue-79865-llvm-miscompile.rs
new file mode 100644
index 000000000..b77f09f8e
--- /dev/null
+++ b/tests/ui/codegen/issue-79865-llvm-miscompile.rs
@@ -0,0 +1,38 @@
+// run-pass
+// only-x86_64
+// compile-flags: -C opt-level=3
+
+// Regression test for issue #79865.
+// The assertion will fail when compiled with Rust 1.56..=1.59
+// due to a LLVM miscompilation.
+
+use std::arch::x86_64::*;
+
+fn main() {
+ if is_x86_feature_detected!("avx") {
+ let res: [f64; 4] = unsafe { std::mem::transmute::<_, _>(first()) };
+ assert_eq!(res, [22.0, 44.0, 66.0, 88.0]);
+ }
+}
+
+#[target_feature(enable = "avx")]
+unsafe fn first() -> __m256d {
+ second()
+}
+
+unsafe fn second() -> __m256d {
+ let v0 = _mm256_setr_pd(1.0, 2.0, 3.0, 4.0);
+ let v1 = _mm256_setr_pd(10.0, 20.0, 30.0, 40.0);
+
+ // needs to be called twice to hit the miscompilation
+ let (add, _) = add_sub(v0, v1);
+ let (add, _) = add_sub(add, add);
+ add
+}
+
+#[inline(never)] // needed to hit the miscompilation
+unsafe fn add_sub(v1: __m256d, v0: __m256d) -> (__m256d, __m256d) {
+ let add = _mm256_add_pd(v0, v1);
+ let sub = _mm256_sub_pd(v0, v1);
+ (add, sub)
+}