move test code to a separate module

egraphs-good · Jan 13, 2024 · 426dcae · 426dcae
1 parent 82d0eca
commit 426dcae
Show file tree

Hide file tree

Showing 2 changed files with 176 additions and 169 deletions.
diff --git a/src/extract/mod.rs b/src/extract/mod.rs
@@ -201,90 +201,3 @@ impl ExtractionResult {
                 .sum::<Cost>()
     }
 }
-
-use ordered_float::NotNan;
-use rand::Rng;
-
-// generates a float between 0 and 1
-fn generate_random_not_nan() -> NotNan<f64> {
-    let mut rng: rand::prelude::ThreadRng = rand::thread_rng();
-    let random_float: f64 = rng.gen();
-    NotNan::new(random_float).unwrap()
-}
-
-//make a random egraph that has a loop-free extraction.
-pub fn generate_random_egraph() -> EGraph {
-    let mut rng = rand::thread_rng();
-    let core_node_count = rng.gen_range(1..100) as usize;
-    let extra_node_count = rng.gen_range(1..100);
-    let mut nodes: Vec<Node> = Vec::with_capacity(core_node_count + extra_node_count);
-    let mut eclass = 0;
-
-    let id2nid = |id: usize| -> NodeId { format!("node_{}", id).into() };
-
-    // Unless we do it explicitly, the costs are almost never equal to others' costs or zero:
-    let get_semi_random_cost = |nodes: &Vec<Node>| -> Cost {
-        let mut rng = rand::thread_rng();
-
-        if nodes.len() > 0 && rng.gen_bool(0.1) {
-            return nodes[rng.gen_range(0..nodes.len())].cost;
-        } else if rng.gen_bool(0.05) {
-            return Cost::default();
-        } else {
-            return generate_random_not_nan() * 100.0;
-        }
-    };
-
-    for i in 0..core_node_count {
-        let children: Vec<NodeId> = (0..i).filter(|_| rng.gen_bool(0.1)).map(id2nid).collect();
-
-        if rng.gen_bool(0.2) {
-            eclass += 1;
-        }
-
-        nodes.push(Node {
-            op: "operation".to_string(),
-            children: children,
-            eclass: eclass.to_string().clone().into(),
-            cost: get_semi_random_cost(&nodes),
-        });
-    }
-
-    // So far we have the nodes for a feasible egraph. Now we add some
-    // cycles to extra nodes - nodes that aren't required in the extraction.
-    for _ in 0..extra_node_count {
-        nodes.push(Node {
-            op: "operation".to_string(),
-            children: vec![],
-            eclass: rng.gen_range(0..eclass * 2 + 1).to_string().clone().into(),
-            cost: get_semi_random_cost(&nodes),
-        });
-    }
-
-    for i in core_node_count..nodes.len() {
-        for j in 0..nodes.len() {
-            if rng.gen_bool(0.05) {
-                nodes.get_mut(i).unwrap().children.push(id2nid(j));
-            }
-        }
-    }
-
-    let mut egraph = EGraph::default();
-
-    for i in 0..nodes.len() {
-        egraph.add_node(id2nid(i), nodes[i].clone());
-    }
-
-    // Set roots
-    for _ in 1..rng.gen_range(2..6) {
-        egraph.root_eclasses.push(
-            nodes
-                .get(rng.gen_range(0..core_node_count))
-                .unwrap()
-                .eclass
-                .clone(),
-        );
-    }
-
-    egraph
-}
diff --git a/src/main.rs b/src/main.rs
@@ -152,111 +152,204 @@ fn main() {
     .unwrap();
 }
 
-/*
-* Checks that no extractors produce better results than the extractors that produce optimal results.
-* Checks that the extractions are valid.
-*/
-
-fn check_optimal_results<I: Iterator<Item = EGraph>>(egraphs: I) {
-    let mut optimal_dag: Vec<Box<dyn Extractor>> = Default::default();
-    let mut optimal_tree: Vec<Box<dyn Extractor>> = Default::default();
-    let mut others: Vec<Box<dyn Extractor>> = Default::default();
-
-    for (_, ed) in extractors().into_iter() {
-        match ed.optimal {
-            Optimal::DAG => optimal_dag.push(ed.extractor),
-            Optimal::Tree => optimal_tree.push(ed.extractor),
-            Optimal::Neither => others.push(ed.extractor),
-        }
+#[cfg(test)]
+mod main_test {
+    /*
+     * Checks that no extractors produce better results than the extractors that produce optimal results.
+     * Checks that the extractions are valid.
+     */
+
+    use crate::{extractors, Extractor, Optimal, EPSILON_ALLOWANCE};
+    pub type Cost = NotNan<f64>;
+    use egraph_serialize::{EGraph, Node, NodeId};
+    use ordered_float::NotNan;
+    use rand::Rng;
+
+    // generates a float between 0 and 1
+    fn generate_random_not_nan() -> NotNan<f64> {
+        let mut rng: rand::prelude::ThreadRng = rand::thread_rng();
+        let random_float: f64 = rng.gen();
+        NotNan::new(random_float).unwrap()
     }
 
-    for egraph in egraphs {
-        let mut optimal_dag_cost: Option<Cost> = None;
-
-        for e in &optimal_dag {
-            let extract = e.extract(&egraph, &egraph.root_eclasses);
-            extract.check(&egraph);
-            let dag_cost = extract.dag_cost(&egraph, &egraph.root_eclasses);
-            let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
-            if optimal_dag_cost.is_none() {
-                optimal_dag_cost = Some(dag_cost);
-                continue;
+    // Make a random egraph that has a loop-free extraction.
+    pub fn generate_random_egraph() -> EGraph {
+        let mut rng = rand::thread_rng();
+        let core_node_count = rng.gen_range(1..100) as usize;
+        let extra_node_count = rng.gen_range(1..100);
+        let mut nodes: Vec<Node> = Vec::with_capacity(core_node_count + extra_node_count);
+        let mut eclass = 0;
+
+        let id2nid = |id: usize| -> NodeId { format!("node_{}", id).into() };
+
+        // Unless we do it explicitly, the costs are almost never equal to others' costs or zero:
+        let get_semi_random_cost = |nodes: &Vec<Node>| -> Cost {
+            let mut rng = rand::thread_rng();
+
+            if nodes.len() > 0 && rng.gen_bool(0.1) {
+                return nodes[rng.gen_range(0..nodes.len())].cost;
+            } else if rng.gen_bool(0.05) {
+                return Cost::default();
+            } else {
+                return generate_random_not_nan() * 100.0;
             }
+        };
 
-            assert!(
-                (dag_cost.into_inner() - optimal_dag_cost.unwrap().into_inner()).abs()
-                    < EPSILON_ALLOWANCE
-            );
+        for i in 0..core_node_count {
+            let children: Vec<NodeId> = (0..i).filter(|_| rng.gen_bool(0.1)).map(id2nid).collect();
 
-            assert!(
-                tree_cost.into_inner() + EPSILON_ALLOWANCE > optimal_dag_cost.unwrap().into_inner()
-            );
+            if rng.gen_bool(0.2) {
+                eclass += 1;
+            }
+
+            nodes.push(Node {
+                op: "operation".to_string(),
+                children: children,
+                eclass: eclass.to_string().clone().into(),
+                cost: get_semi_random_cost(&nodes),
+            });
         }
 
-        let mut optimal_tree_cost: Option<Cost> = None;
+        // So far we have the nodes for a feasible egraph. Now we add some
+        // cycles to extra nodes - nodes that aren't required in the extraction.
+        for _ in 0..extra_node_count {
+            nodes.push(Node {
+                op: "operation".to_string(),
+                children: vec![],
+                eclass: rng.gen_range(0..eclass * 2 + 1).to_string().clone().into(),
+                cost: get_semi_random_cost(&nodes),
+            });
+        }
 
-        for e in &optimal_tree {
-            let extract = e.extract(&egraph, &egraph.root_eclasses);
-            extract.check(&egraph);
-            let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
-            if optimal_tree_cost.is_none() {
-                optimal_tree_cost = Some(tree_cost);
-                continue;
+        for i in core_node_count..nodes.len() {
+            for j in 0..nodes.len() {
+                if rng.gen_bool(0.05) {
+                    nodes.get_mut(i).unwrap().children.push(id2nid(j));
+                }
             }
+        }
+
+        let mut egraph = EGraph::default();
+
+        for i in 0..nodes.len() {
+            egraph.add_node(id2nid(i), nodes[i].clone());
+        }
 
-            assert!(
-                (tree_cost.into_inner() - optimal_tree_cost.unwrap().into_inner()).abs()
-                    < EPSILON_ALLOWANCE
+        // Set roots
+        for _ in 1..rng.gen_range(2..6) {
+            egraph.root_eclasses.push(
+                nodes
+                    .get(rng.gen_range(0..core_node_count))
+                    .unwrap()
+                    .eclass
+                    .clone(),
             );
         }
 
-        if optimal_dag_cost.is_some() && optimal_tree_cost.is_some() {
-            assert!(optimal_dag_cost.unwrap() < optimal_tree_cost.unwrap() + EPSILON_ALLOWANCE);
+        egraph
+    }
+
+    fn check_optimal_results<I: Iterator<Item = EGraph>>(egraphs: I) {
+        let mut optimal_dag: Vec<Box<dyn Extractor>> = Default::default();
+        let mut optimal_tree: Vec<Box<dyn Extractor>> = Default::default();
+        let mut others: Vec<Box<dyn Extractor>> = Default::default();
+
+        for (_, ed) in extractors().into_iter() {
+            match ed.optimal {
+                Optimal::DAG => optimal_dag.push(ed.extractor),
+                Optimal::Tree => optimal_tree.push(ed.extractor),
+                Optimal::Neither => others.push(ed.extractor),
+            }
         }
 
-        for e in &others {
-            let extract = e.extract(&egraph, &egraph.root_eclasses);
-            extract.check(&egraph);
-            let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
-            let dag_cost = extract.dag_cost(&egraph, &egraph.root_eclasses);
+        for egraph in egraphs {
+            let mut optimal_dag_cost: Option<Cost> = None;
+
+            for e in &optimal_dag {
+                let extract = e.extract(&egraph, &egraph.root_eclasses);
+                extract.check(&egraph);
+                let dag_cost = extract.dag_cost(&egraph, &egraph.root_eclasses);
+                let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
+                if optimal_dag_cost.is_none() {
+                    optimal_dag_cost = Some(dag_cost);
+                    continue;
+                }
+
+                assert!(
+                    (dag_cost.into_inner() - optimal_dag_cost.unwrap().into_inner()).abs()
+                        < EPSILON_ALLOWANCE
+                );
+
+                assert!(
+                    tree_cost.into_inner() + EPSILON_ALLOWANCE
+                        > optimal_dag_cost.unwrap().into_inner()
+                );
+            }
+
+            let mut optimal_tree_cost: Option<Cost> = None;
+
+            for e in &optimal_tree {
+                let extract = e.extract(&egraph, &egraph.root_eclasses);
+                extract.check(&egraph);
+                let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
+                if optimal_tree_cost.is_none() {
+                    optimal_tree_cost = Some(tree_cost);
+                    continue;
+                }
+
+                assert!(
+                    (tree_cost.into_inner() - optimal_tree_cost.unwrap().into_inner()).abs()
+                        < EPSILON_ALLOWANCE
+                );
+            }
 
-            // The optimal tree cost should be <= any extractor's tree cost.
-            if optimal_tree_cost.is_some() {
-                assert!(optimal_tree_cost.unwrap() <= tree_cost + EPSILON_ALLOWANCE);
+            if optimal_dag_cost.is_some() && optimal_tree_cost.is_some() {
+                assert!(optimal_dag_cost.unwrap() < optimal_tree_cost.unwrap() + EPSILON_ALLOWANCE);
             }
 
-            if optimal_dag_cost.is_some() {
-                // The optimal dag should be less <= any extractor's dag cost
-                assert!(optimal_dag_cost.unwrap() <= dag_cost + EPSILON_ALLOWANCE);
+            for e in &others {
+                let extract = e.extract(&egraph, &egraph.root_eclasses);
+                extract.check(&egraph);
+                let tree_cost = extract.tree_cost(&egraph, &egraph.root_eclasses);
+                let dag_cost = extract.dag_cost(&egraph, &egraph.root_eclasses);
+
+                // The optimal tree cost should be <= any extractor's tree cost.
+                if optimal_tree_cost.is_some() {
+                    assert!(optimal_tree_cost.unwrap() <= tree_cost + EPSILON_ALLOWANCE);
+                }
+
+                if optimal_dag_cost.is_some() {
+                    // The optimal dag cost should be <= any extractor's dag cost.
+                    assert!(optimal_dag_cost.unwrap() <= dag_cost + EPSILON_ALLOWANCE);
+                }
             }
         }
     }
-}
 
-// Run on all the .json files in the data/fuzz directory
-#[test]
-fn run_on_test_egraphs() {
-    use walkdir::WalkDir;
-
-    let egraphs = WalkDir::new("./test_data/")
-        .into_iter()
-        .filter_map(Result::ok)
-        .filter(|e| {
-            e.file_type().is_file()
-                && e.path().extension().and_then(std::ffi::OsStr::to_str) == Some("json")
-        })
-        .map(|e| e.path().to_string_lossy().into_owned())
-        .map(|e| EGraph::from_json_file(e).unwrap());
-    check_optimal_results(egraphs);
-}
+    // Run on all the .json test files
+    #[test]
+    fn run_on_test_egraphs() {
+        use walkdir::WalkDir;
+
+        let egraphs = WalkDir::new("./test_data/")
+            .into_iter()
+            .filter_map(Result::ok)
+            .filter(|e| {
+                e.file_type().is_file()
+                    && e.path().extension().and_then(std::ffi::OsStr::to_str) == Some("json")
+            })
+            .map(|e| e.path().to_string_lossy().into_owned())
+            .map(|e| EGraph::from_json_file(e).unwrap());
+        check_optimal_results(egraphs);
+    }
 
-#[test]
-#[should_panic]
-fn check_assert_enabled() {
-    assert!(false);
-}
+    #[test]
+    #[should_panic]
+    fn check_assert_enabled() {
+        assert!(false);
+    }
 
-macro_rules! create_optimal_check_tests {
+    macro_rules! create_optimal_check_tests {
     ($($name:ident),*) => {
         $(
             #[test]
@@ -270,4 +363,5 @@ macro_rules! create_optimal_check_tests {
     }
 }
 
-create_optimal_check_tests!(check0, check1, check2, check3, check4, check5, check6, check7);
+    create_optimal_check_tests!(check0, check1, check2, check3, check4, check5, check6, check7);
+}