fortrangoingonforty/armfortas / 71d02aa

Browse files

Test WHERE/ELSEWHERE array-load else vectorizes at O3

Authored by mfwolffe <wolffemf@dukes.jmu.edu>
SHA
71d02aab73790841e70ccfa44a056186c4c834cb
Parents
9173691
Tree
de3cb38

2 changed files

StatusFile+-
A test_programs/do_loop_vectorize_where_elsewhere_arr.f90 30 0
A tests/vectorize_where_elsewhere_arr.rs 74 0
test_programs/do_loop_vectorize_where_elsewhere_arr.f90added
@@ -0,0 +1,30 @@
1
+! WHERE / ELSEWHERE both arms loading from arrays:
2
+!   where (a > 0) c = a
3
+!   elsewhere    c = b
4
+! lowers to vselect(mask, vload_a, vload_b) → vstore_c.
5
+!
6
+! a(i) = i - 16 (range -15..16); b(i) = 1000.0 + i; c(i) = 0.
7
+! WHERE a > 0 (lanes 17..32): c ← a (= 1..16).
8
+! ELSEWHERE                    : c ← b (= 1001..1016 for lanes 1..16).
9
+!   c(1)  = 1001 (mask=false → b(1))
10
+!   c(16) = 1016 (a(16)=0, NOT > 0 → b(16))
11
+!   c(17) = 1.0  (mask=true → a = 1)
12
+!   c(32) = 16.0 (mask=true → a = 16)
13
+!
14
+! CHECK: 1.0010000E3     1.0160000E3     1.0000000E0     1.6000000E1
15
+program test_do_loop_vectorize_where_elsewhere_arr
16
+  implicit none
17
+  integer :: i
18
+  real(4) :: a(32), b(32), c(32)
19
+  do i = 1, 32
20
+    a(i) = real(i - 16, 4)
21
+    b(i) = real(1000 + i, 4)
22
+    c(i) = 0.0
23
+  end do
24
+  where (a > 0.0)
25
+    c = a
26
+  elsewhere
27
+    c = b
28
+  end where
29
+  print *, c(1), c(16), c(17), c(32)
30
+end program test_do_loop_vectorize_where_elsewhere_arr
tests/vectorize_where_elsewhere_arr.rsadded
@@ -0,0 +1,74 @@
1
+use std::collections::BTreeSet;
2
+use std::path::PathBuf;
3
+
4
+use armfortas::driver::OptLevel;
5
+use armfortas::testing::{capture_from_path, CaptureRequest, CapturedStage, Stage};
6
+
7
+fn fixture(name: &str) -> PathBuf {
8
+    let path = PathBuf::from("test_programs").join(name);
9
+    assert!(path.exists(), "missing test fixture {}", path.display());
10
+    path
11
+}
12
+
13
+fn capture_text(request: CaptureRequest, stage: Stage) -> String {
14
+    let result = capture_from_path(&request).expect("capture should succeed");
15
+    match result.get(stage) {
16
+        Some(CapturedStage::Text(text)) => text.clone(),
17
+        Some(CapturedStage::Run(_)) => panic!("expected text stage for {}", stage.as_str()),
18
+        None => panic!("missing requested stage {}", stage.as_str()),
19
+    }
20
+}
21
+
22
+fn capture_run_stdout(request: CaptureRequest) -> String {
23
+    let result = capture_from_path(&request).expect("capture should succeed");
24
+    match result.get(Stage::Run) {
25
+        Some(CapturedStage::Run(run)) => run.stdout.clone(),
26
+        _ => panic!("missing run stage"),
27
+    }
28
+}
29
+
30
+#[test]
31
+fn o3_vectorizes_where_elsewhere_with_array_load_else() {
32
+    let source = fixture("do_loop_vectorize_where_elsewhere_arr.f90");
33
+
34
+    let o3_ir = capture_text(
35
+        CaptureRequest {
36
+            input: source.clone(),
37
+            requested: BTreeSet::from([Stage::OptIr]),
38
+            opt_level: OptLevel::O3,
39
+        },
40
+        Stage::OptIr,
41
+    );
42
+    // The two-arm `c = a; elsewhere; c = b` should produce a vselect
43
+    // whose true arm is vload(a) and false arm is vload(b) — at
44
+    // least 2 vloads in the WHERE body block.
45
+    assert_eq!(
46
+        o3_ir.matches("vselect").count(),
47
+        1,
48
+        "expected exactly one vselect:\n{}",
49
+        o3_ir
50
+    );
51
+    assert!(
52
+        o3_ir.matches("vload").count() >= 2,
53
+        "expected ≥2 vloads (a and d):\n{}",
54
+        o3_ir
55
+    );
56
+
57
+    let stdout = capture_run_stdout(CaptureRequest {
58
+        input: source,
59
+        requested: BTreeSet::from([Stage::Run]),
60
+        opt_level: OptLevel::O3,
61
+    });
62
+    let trimmed: Vec<&str> = stdout
63
+        .lines()
64
+        .map(|l| l.trim())
65
+        .filter(|l| !l.is_empty())
66
+        .collect();
67
+    assert_eq!(trimmed.len(), 1, "expected one output line:\n{}", stdout);
68
+    assert_eq!(
69
+        trimmed[0],
70
+        "1.0010000E3     1.0160000E3     1.0000000E0     1.6000000E1",
71
+        "WHERE/ELSEWHERE-arr wrong: {:?}",
72
+        trimmed[0]
73
+    );
74
+}