fortrangoingonforty/armfortas / 6bfb8b4

Browse files

Test WHERE then-arm binop on second array load vectorizes at O3

Authored by mfwolffe <wolffemf@dukes.jmu.edu>
SHA
6bfb8b4b76da9b426db1d67a24a82ec6c33e1d77
Parents
faff757
Tree
f56f6b0

2 changed files

Status | File | + | -
A | test_programs/do_loop_vectorize_where_binop_on_b.f90 | 29 | 0
A | tests/vectorize_where_binop_on_b.rs | 71 | 0
test_programs/do_loop_vectorize_where_binop_on_b.f90 (added)
@@ -0,0 +1,29 @@
1
+! WHERE then-arm with binop where the main load is on a SECOND array,
2
+! paired with a loop-invariant scalar:
3
+!   where (a > 0) c = K + d
4
+!
5
+! Lifts to vselect(mask, vadd(vbcast(K), vload(d)), vload_c_old).
6
+!
7
+! a(i) = i - 16; d(i) = real(i, 4); c(i) = 0.
8
+! WHERE a > 0 (lanes 17..32): c ← 100 + d (= 117 .. 132).
9
+!   c(1)  = 0.0   (mask=false)
10
+!   c(16) = 0.0   (a(16)=0, NOT > 0)
11
+!   c(17) = 117.0 (mask=true → 100 + d(17) = 100 + 17)
12
+!   c(32) = 132.0 (mask=true → 100 + d(32) = 100 + 32)
13
+!
14
+! CHECK: 0.0000000E0     0.0000000E0     1.1700000E2     1.3200000E2
15
+program test_do_loop_vectorize_where_binop_on_b
16
+  implicit none
17
+  integer :: i
18
+  real(4) :: a(32), c(32), d(32), hundred
19
+  hundred = 100.0
20
+  do i = 1, 32
21
+    a(i) = real(i - 16, 4)
22
+    d(i) = real(i, 4)
23
+    c(i) = 0.0
24
+  end do
25
+  where (a > 0.0)
26
+    c = hundred + d
27
+  end where
28
+  print *, c(1), c(16), c(17), c(32)
29
+end program test_do_loop_vectorize_where_binop_on_b
tests/vectorize_where_binop_on_b.rs (added)
@@ -0,0 +1,71 @@
1
+use std::collections::BTreeSet;
2
+use std::path::PathBuf;
3
+
4
+use armfortas::driver::OptLevel;
5
+use armfortas::testing::{capture_from_path, CaptureRequest, CapturedStage, Stage};
6
+
7
+fn fixture(name: &str) -> PathBuf {
8
+    let path = PathBuf::from("test_programs").join(name);
9
+    assert!(path.exists(), "missing test fixture {}", path.display());
10
+    path
11
+}
12
+
13
+fn capture_text(request: CaptureRequest, stage: Stage) -> String {
14
+    let result = capture_from_path(&request).expect("capture should succeed");
15
+    match result.get(stage) {
16
+        Some(CapturedStage::Text(text)) => text.clone(),
17
+        Some(CapturedStage::Run(_)) => panic!("expected text stage for {}", stage.as_str()),
18
+        None => panic!("missing requested stage {}", stage.as_str()),
19
+    }
20
+}
21
+
22
+fn capture_run_stdout(request: CaptureRequest) -> String {
23
+    let result = capture_from_path(&request).expect("capture should succeed");
24
+    match result.get(Stage::Run) {
25
+        Some(CapturedStage::Run(run)) => run.stdout.clone(),
26
+        _ => panic!("missing run stage"),
27
+    }
28
+}
29
+
30
+#[test]
31
+fn o3_vectorizes_where_with_binop_on_second_array_load() {
32
+    let source = fixture("do_loop_vectorize_where_binop_on_b.f90");
33
+
34
+    let o3_ir = capture_text(
35
+        CaptureRequest {
36
+            input: source.clone(),
37
+            requested: BTreeSet::from([Stage::OptIr]),
38
+            opt_level: OptLevel::O3,
39
+        },
40
+        Stage::OptIr,
41
+    );
42
+    assert_eq!(
43
+        o3_ir.matches("vselect").count(),
44
+        1,
45
+        "expected one vselect:\n{}",
46
+        o3_ir
47
+    );
48
+    assert!(
49
+        o3_ir.contains("vadd"),
50
+        "expected vadd lifted from `c = K + d` then arm:\n{}",
51
+        o3_ir
52
+    );
53
+
54
+    let stdout = capture_run_stdout(CaptureRequest {
55
+        input: source,
56
+        requested: BTreeSet::from([Stage::Run]),
57
+        opt_level: OptLevel::O3,
58
+    });
59
+    let trimmed: Vec<&str> = stdout
60
+        .lines()
61
+        .map(|l| l.trim())
62
+        .filter(|l| !l.is_empty())
63
+        .collect();
64
+    assert_eq!(trimmed.len(), 1, "expected one output line:\n{}", stdout);
65
+    assert_eq!(
66
+        trimmed[0],
67
+        "0.0000000E0     0.0000000E0     1.1700000E2     1.3200000E2",
68
+        "WHERE-binop-on-b wrong: {:?}",
69
+        trimmed[0]
70
+    );
71
+}