Rust · 2524 bytes Raw Blame History
1 use std::collections::BTreeSet;
2 use std::path::PathBuf;
3
4 use armfortas::driver::OptLevel;
5 use armfortas::testing::{capture_from_path, CaptureRequest, CapturedStage, Stage};
6
/// Resolves `name` inside the relative `test_programs` directory.
///
/// # Panics
///
/// Panics when the resulting path does not exist, so a missing fixture is
/// reported up front rather than as a later capture failure.
fn fixture(name: &str) -> PathBuf {
    let mut location = PathBuf::from("test_programs");
    location.push(name);
    assert!(
        location.exists(),
        "missing test fixture {}",
        location.display()
    );
    location
}
12
13 fn capture_text(request: CaptureRequest, stage: Stage) -> String {
14 let result = capture_from_path(&request).expect("capture should succeed");
15 match result.get(stage) {
16 Some(CapturedStage::Text(text)) => text.clone(),
17 Some(CapturedStage::Run(_)) => panic!("expected text stage for {}", stage.as_str()),
18 None => panic!("missing requested stage {}", stage.as_str()),
19 }
20 }
21
22 fn capture_run_stdout(request: CaptureRequest) -> String {
23 let result = capture_from_path(&request).expect("capture should succeed");
24 match result.get(Stage::Run) {
25 Some(CapturedStage::Run(run)) => run.stdout.clone(),
26 _ => panic!("missing run stage"),
27 }
28 }
29
#[test]
fn o3_vectorizes_pure_array_copy_loop() {
    let source = fixture("do_loop_vectorize_copy.f90");

    // Step 1: inspect the optimized IR produced at O3.
    let ir_request = CaptureRequest {
        input: source.clone(),
        requested: BTreeSet::from([Stage::OptIr]),
        opt_level: OptLevel::O3,
    };
    let o3_ir = capture_text(ir_request, Stage::OptIr);

    let mentions = |needle: &str| o3_ir.contains(needle);

    // Two vectorized shapes are recognised:
    //   * NeonVectorize: inline vload/vstore with no vector arithmetic op.
    //   * The older Vectorize fallback: a call to afs_array_copy_i32.
    let has_vector_arith = ["vadd", "vsub", "vmul"].iter().any(|&op| mentions(op));
    let neon = mentions("vload") && mentions("vstore") && !has_vector_arith;
    let kernel = mentions("call @afs_array_copy_i32(");

    // The assertions are layered so the failure message says what went
    // wrong: first "not vectorized at all", then "vectorized, but through
    // the runtime kernel instead of the preferred NEON path".
    assert!(
        neon || kernel,
        "O3 should vectorize a pure c(i) = b(i) copy loop:\n{}",
        o3_ir
    );
    assert!(
        neon,
        "O3 should pick the NeonVectorize copy path over the runtime kernel:\n{}",
        o3_ir
    );

    // Step 2: run the program and compare its non-blank, trimmed output
    // lines. Expected values are c(1) = 1 and c(32) = 32 (per the fixture's
    // intent, b is filled with its own index).
    let run_request = CaptureRequest {
        input: source,
        requested: BTreeSet::from([Stage::Run]),
        opt_level: OptLevel::O3,
    };
    let stdout = capture_run_stdout(run_request);

    let printed: Vec<&str> = stdout
        .lines()
        .map(str::trim)
        .filter(|line| !line.is_empty())
        .collect();
    assert_eq!(
        printed,
        ["1", "32"],
        "vectorized copy should preserve element values:\n{}",
        stdout
    );
}
80