fortrangoingonforty/armfortas / 2c6ef19

Browse files

Test O3 picks NEON copy form and runtime preserves element values

Authored by mfwolffe <wolffemf@dukes.jmu.edu>
SHA
2c6ef19ed482b1c65dbf34a8656340b34cbf02ce
Parents
7703ccf
Tree
4c262c4

1 changed file

Status  File  +  -
A tests/vectorize_array_copy.rs 79 0
tests/vectorize_array_copy.rs (added)
@@ -0,0 +1,79 @@
1
+use std::collections::BTreeSet;
2
+use std::path::PathBuf;
3
+
4
+use armfortas::driver::OptLevel;
5
+use armfortas::testing::{capture_from_path, CaptureRequest, CapturedStage, Stage};
6
+
7
/// Builds the path to a test fixture named `name` inside the relative
/// `test_programs` directory.
///
/// The path is relative, so the existence check resolves against the
/// process's current working directory.
///
/// # Panics
///
/// Panics with `missing test fixture <path>` when nothing exists at the
/// resulting path.
fn fixture(name: &str) -> PathBuf {
    let mut candidate = PathBuf::from("test_programs");
    candidate.push(name);
    // Fail loudly up front so a misnamed fixture is not mistaken for a
    // compiler failure later in the test.
    if !candidate.exists() {
        panic!("missing test fixture {}", candidate.display());
    }
    candidate
}
12
+
13
+fn capture_text(request: CaptureRequest, stage: Stage) -> String {
14
+    let result = capture_from_path(&request).expect("capture should succeed");
15
+    match result.get(stage) {
16
+        Some(CapturedStage::Text(text)) => text.clone(),
17
+        Some(CapturedStage::Run(_)) => panic!("expected text stage for {}", stage.as_str()),
18
+        None => panic!("missing requested stage {}", stage.as_str()),
19
+    }
20
+}
21
+
22
+fn capture_run_stdout(request: CaptureRequest) -> String {
23
+    let result = capture_from_path(&request).expect("capture should succeed");
24
+    match result.get(Stage::Run) {
25
+        Some(CapturedStage::Run(run)) => run.stdout.clone(),
26
+        _ => panic!("missing run stage"),
27
+    }
28
+}
29
+
30
/// Compiles `do_loop_vectorize_copy.f90` at `O3` and checks two things:
/// the optimized IR uses the inline vector load/store copy form, and the
/// program's output still consists of the lines `1` and `32`.
#[test]
fn o3_vectorizes_pure_array_copy_loop() {
    let fixture_path = fixture("do_loop_vectorize_copy.f90");

    let ir_request = CaptureRequest {
        input: fixture_path.clone(),
        requested: BTreeSet::from([Stage::OptIr]),
        opt_level: OptLevel::O3,
    };
    let optimized_ir = capture_text(ir_request, Stage::OptIr);

    // The NeonVectorize copy form shows up as inline vload/vstore with no
    // vector arithmetic; the older Vectorize fallback shows up as a call
    // to the afs_array_copy_i32 runtime kernel.
    let has_vector_memory_ops = optimized_ir.contains("vload") && optimized_ir.contains("vstore");
    let has_vector_arithmetic = ["vadd", "vsub", "vmul"]
        .iter()
        .any(|op| optimized_ir.contains(*op));
    let uses_neon_copy = has_vector_memory_ops && !has_vector_arithmetic;
    let uses_runtime_kernel = optimized_ir.contains("call @afs_array_copy_i32(");

    // First, a broad check that the loop was vectorized in either form, so
    // a complete miss is reported as such.
    assert!(
        uses_neon_copy || uses_runtime_kernel,
        "O3 should vectorize a pure c(i) = b(i) copy loop:\n{}",
        optimized_ir
    );
    // Then the strict requirement: the NEON form specifically must win.
    assert!(
        uses_neon_copy,
        "O3 should pick the NeonVectorize copy path over the runtime kernel:\n{}",
        optimized_ir
    );

    // Runtime check. The fixture source is not visible here; per the
    // original note it fills b with its index and prints c(1) and c(32),
    // so the expected output lines are "1" and "32".
    let run_request = CaptureRequest {
        input: fixture_path,
        requested: BTreeSet::from([Stage::Run]),
        opt_level: OptLevel::O3,
    };
    let program_output = capture_run_stdout(run_request);
    let printed_values: Vec<&str> = program_output
        .lines()
        .map(str::trim)
        .filter(|line| !line.is_empty())
        .collect();
    assert_eq!(
        printed_values,
        vec!["1", "32"],
        "vectorized copy should preserve element values:\n{}",
        program_output
    );
}