diff --git a/hugr-core/src/hugr/patch/inline_dfg.rs b/hugr-core/src/hugr/patch/inline_dfg.rs
index bc14ae8af1..f5a3653ee4 100644
--- a/hugr-core/src/hugr/patch/inline_dfg.rs
+++ b/hugr-core/src/hugr/patch/inline_dfg.rs
@@ -3,36 +3,37 @@
 //! and deleting the DFG along with its Input + Output
 
 use super::{PatchHugrMut, PatchVerification};
+use crate::core::HugrNode;
 use crate::ops::handle::{DfgID, NodeHandle};
 use crate::{HugrView, IncomingPort, Node, OutgoingPort, PortIndex};
 
 /// Structure identifying an `InlineDFG` rewrite from the spec
-pub struct InlineDFG(pub DfgID);
+pub struct InlineDFG<N = Node>(pub DfgID<N>);
 
 /// Errors from an [`InlineDFG`] rewrite.
 #[derive(Clone, Debug, PartialEq, Eq, thiserror::Error)]
 #[non_exhaustive]
-pub enum InlineDFGError {
+pub enum InlineDFGError<N = Node> {
     /// Node to inline was not a DFG. (E.g. node has been overwritten since the `DfgID` originated.)
     #[error("{node} was not a DFG")]
     NotDFG {
         /// The node we tried to inline
-        node: Node,
+        node: N,
     },
     /// The DFG node is the hugr entrypoint
     #[error("Cannot inline the entrypoint node, {node}")]
     CantInlineEntrypoint {
         /// The node we tried to inline
-        node: Node,
+        node: N,
     },
 }
 
-impl PatchVerification for InlineDFG {
-    type Error = InlineDFGError;
+impl<N: HugrNode> PatchVerification for InlineDFG<N> {
+    type Error = InlineDFGError<N>;
 
-    type Node = Node;
+    type Node = N;
 
-    fn verify(&self, h: &impl crate::HugrView<Node = Node>) -> Result<(), Self::Error> {
+    fn verify(&self, h: &impl crate::HugrView<Node = N>) -> Result<(), Self::Error> {
         let n = self.0.node();
         if h.get_optype(n).as_dfg().is_none() {
             return Err(InlineDFGError::NotDFG { node: n });
@@ -51,15 +52,15 @@ impl PatchVerification for InlineDFG {
     }
 }
 
-impl PatchHugrMut for InlineDFG {
+impl<N: HugrNode> PatchHugrMut for InlineDFG<N> {
     /// The removed nodes: the DFG, and its Input and Output children.
-    type Outcome = [Node; 3];
+    type Outcome = [N; 3];
 
     const UNCHANGED_ON_FAILURE: bool = true;
 
     fn apply_hugr_mut(
         self,
-        h: &mut impl crate::hugr::HugrMut<Node = Node>,
+        h: &mut impl crate::hugr::HugrMut<Node = N>,
     ) -> Result<Self::Outcome, Self::Error> {
         self.verify(h)?;
         let n = self.0.node();
diff --git a/hugr-core/src/ops/tag.rs b/hugr-core/src/ops/tag.rs
index 2834cd94eb..f329bcb7b9 100644
--- a/hugr-core/src/ops/tag.rs
+++ b/hugr-core/src/ops/tag.rs
@@ -9,7 +9,7 @@ use std::{cmp, fmt::Display};
 ///
 /// Uses a flat representation for all the variants, in contrast to the complex
 /// `OpType` structures.
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
+#[derive(Debug, Clone, Copy, Hash, PartialEq, Eq, Default)]
 #[non_exhaustive]
 pub enum OpTag {
     /// All operations allowed.
diff --git a/hugr-passes/src/lib.rs b/hugr-passes/src/lib.rs
index 6e97f3422e..2a0cbb01a5 100644
--- a/hugr-passes/src/lib.rs
+++ b/hugr-passes/src/lib.rs
@@ -17,10 +17,34 @@ pub use inline_funcs::inline_acyclic;
 pub mod linearize_array;
 pub use linearize_array::LinearizeArrayPass;
 pub mod lower;
-pub mod merge_bbs;
 mod monomorphize;
+pub mod normalize_cfgs;
 pub mod untuple;
 
+/// Merge basic blocks. Subset of [normalize_cfgs], use the latter.
+#[deprecated(note = "Use normalize_cfgs", since = "0.23.0")]
+pub mod merge_bbs {
+    use hugr_core::hugr::{hugrmut::HugrMut, views::RootCheckable};
+    use hugr_core::ops::handle::CfgID;
+
+    /// Merge any basic blocks that are direct children of the specified CFG
+    /// i.e. where a basic block B has a single successor B' whose only predecessor
+    /// is B, B and B' can be combined.
+    ///
+    /// # Panics
+    ///
+    /// If the `entrypoint` of `cfg` is not an [OpType::CFG]
+    ///
+    /// [OpType::CFG]: hugr_core::ops::OpType::CFG
+    #[deprecated(note = "Use version in normalize_cfgs", since = "0.23.0")]
+    pub fn merge_basic_blocks<'h, H: 'h + HugrMut>(
+        cfg: impl RootCheckable<&'h mut H, CfgID<H::Node>>,
+    ) {
+        let checked = cfg.try_into_checked().expect("Hugr must be a CFG region");
+        super::normalize_cfgs::merge_basic_blocks(checked.into_hugr()).unwrap();
+    }
+}
+
 pub use monomorphize::{MonomorphizePass, mangle_name, monomorphize};
 pub mod replace_types;
 pub use replace_types::ReplaceTypes;
diff --git a/hugr-passes/src/merge_bbs.rs b/hugr-passes/src/merge_bbs.rs
deleted file mode 100644
index 3c6d9c9b2d..0000000000
--- a/hugr-passes/src/merge_bbs.rs
+++ /dev/null
@@ -1,384 +0,0 @@
-//! Merge BBs along control-flow edges where the source BB has no other successors
-//! and the target BB has no other predecessors.
-use std::collections::HashMap;
-
-use hugr_core::extension::prelude::UnpackTuple;
-use hugr_core::hugr::hugrmut::HugrMut;
-use hugr_core::hugr::views::RootCheckable;
-use itertools::Itertools;
-
-use hugr_core::hugr::patch::inline_dfg::InlineDFG;
-use hugr_core::hugr::patch::replace::{NewEdgeKind, NewEdgeSpec, Replacement};
-use hugr_core::ops::handle::CfgID;
-use hugr_core::ops::{DFG, DataflowBlock, DataflowParent, Input, Output};
-use hugr_core::{Hugr, HugrView, Node};
-
-/// Merge any basic blocks that are direct children of the specified CFG
-/// i.e. where a basic block B has a single successor B' whose only predecessor
-/// is B, B and B' can be combined.
-pub fn merge_basic_blocks<'h, H>(cfg: impl RootCheckable<&'h mut H, CfgID>)
-where
-    H: 'h + HugrMut<Node = Node>,
-{
-    let checked = cfg.try_into_checked().expect("Hugr must be a CFG region");
-    let cfg = checked.into_hugr();
-
-    let mut worklist = cfg.children(cfg.entrypoint()).collect::<Vec<_>>();
-    while let Some(n) = worklist.pop() {
-        // Consider merging n with its successor
-        let Ok(succ) = cfg.output_neighbours(n).exactly_one() else {
-            continue;
-        };
-        if cfg.input_neighbours(succ).count() != 1 {
-            continue;
-        }
-        if cfg.children(cfg.entrypoint()).take(2).contains(&succ) {
-            // If succ is...
-            //   - the entry block, that has an implicit extra in-edge, so cannot merge with n.
-            //   - the exit block, nodes in n should move *outside* the CFG - a separate pass.
-            continue;
-        }
-        let (rep, merge_bb, dfgs) = mk_rep(cfg, n, succ);
-        let node_map = cfg.apply_patch(rep).unwrap();
-        let merged_bb = *node_map.get(&merge_bb).unwrap();
-        for dfg_id in dfgs {
-            let n_id = *node_map.get(&dfg_id).unwrap();
-            cfg.apply_patch(InlineDFG(n_id.into())).unwrap();
-        }
-        worklist.push(merged_bb);
-    }
-}
-
-fn mk_rep(
-    cfg: &impl HugrView<Node = Node>,
-    pred: Node,
-    succ: Node,
-) -> (Replacement, Node, [Node; 2]) {
-    let pred_ty = cfg.get_optype(pred).as_dataflow_block().unwrap();
-    let succ_ty = cfg.get_optype(succ).as_dataflow_block().unwrap();
-    let succ_sig = succ_ty.inner_signature();
-
-    // Make a Hugr with just a single CFG root node having the same signature.
-    let mut replacement: Hugr = Hugr::new_with_entrypoint(cfg.entrypoint_optype().clone())
-        .expect("Replacement should have a CFG entrypoint");
-
-    let merged = replacement.add_node_with_parent(replacement.entrypoint(), {
-        DataflowBlock {
-            inputs: pred_ty.inputs.clone(),
-            ..succ_ty.clone()
-        }
-    });
-    let input = replacement.add_node_with_parent(
-        merged,
-        Input {
-            types: pred_ty.inputs.clone(),
-        },
-    );
-    let output = replacement.add_node_with_parent(
-        merged,
-        Output {
-            types: succ_sig.output.clone(),
-        },
-    );
-
-    let dfg1 = replacement.add_node_with_parent(
-        merged,
-        DFG {
-            signature: pred_ty.inner_signature().into_owned(),
-        },
-    );
-    for (i, _) in pred_ty.inputs.iter().enumerate() {
-        replacement.connect(input, i, dfg1, i);
-    }
-
-    let dfg2 = replacement.add_node_with_parent(
-        merged,
-        DFG {
-            signature: succ_sig.as_ref().clone(),
-        },
-    );
-    for (i, _) in succ_sig.output.iter().enumerate() {
-        replacement.connect(dfg2, i, output, i);
-    }
-
-    // At the junction, must unpack the first (tuple, branch predicate) output
-    let tuple_elems = pred_ty.sum_rows.clone().into_iter().exactly_one().unwrap();
-    let unp = replacement.add_node_with_parent(merged, UnpackTuple::new(tuple_elems.clone()));
-    replacement.connect(dfg1, 0, unp, 0);
-    let other_start = tuple_elems.len();
-    for (i, _) in tuple_elems.iter().enumerate() {
-        replacement.connect(unp, i, dfg2, i);
-    }
-    for (i, _) in pred_ty.other_outputs.iter().enumerate() {
-        replacement.connect(dfg1, i + 1, dfg2, i + other_start);
-    }
-    // If there are edges from succ back to pred, we cannot do these via the mu_inp/out/new
-    // edge-maps as both source and target of the new edge are in the replacement Hugr
-    for (_, src_pos) in cfg.all_linked_outputs(pred).filter(|(src, _)| *src == succ) {
-        replacement.connect(merged, src_pos, merged, 0);
-    }
-    let rep = Replacement {
-        removal: vec![pred, succ],
-        replacement,
-        adoptions: HashMap::from([(dfg1, pred), (dfg2, succ)]),
-        mu_inp: cfg
-            .all_linked_outputs(pred)
-            .filter(|(src, _)| *src != succ)
-            .map(|(src, src_pos)| NewEdgeSpec {
-                src,
-                tgt: merged,
-                kind: NewEdgeKind::ControlFlow { src_pos },
-            })
-            .collect(),
-        mu_out: cfg
-            .node_outputs(succ)
-            .filter_map(|src_pos| {
-                let tgt = cfg
-                    .linked_inputs(succ, src_pos)
-                    .exactly_one()
-                    .ok()
-                    .unwrap()
-                    .0;
-                if tgt == pred {
-                    None
-                } else {
-                    Some(NewEdgeSpec {
-                        src: merged,
-                        tgt,
-                        kind: NewEdgeKind::ControlFlow { src_pos },
-                    })
-                }
-            })
-            .collect(),
-        mu_new: vec![],
-    };
-    (rep, merged, [dfg1, dfg2])
-}
-
-#[cfg(test)]
-mod test {
-    use std::collections::HashSet;
-    use std::sync::Arc;
-
-    use hugr_core::extension::prelude::PRELUDE_ID;
-    use itertools::Itertools;
-    use rstest::rstest;
-
-    use hugr_core::builder::{CFGBuilder, DFGWrapper, Dataflow, HugrBuilder, endo_sig, inout_sig};
-    use hugr_core::extension::prelude::{ConstUsize, qb_t, usize_t};
-    use hugr_core::ops::constant::Value;
-    use hugr_core::ops::{LoadConstant, OpTrait, OpType};
-    use hugr_core::types::{Signature, Type, TypeRow};
-    use hugr_core::{Extension, Hugr, HugrView, Wire, const_extension_ids, type_row};
-
-    use super::merge_basic_blocks;
-
-    const_extension_ids! {
-        const EXT_ID: ExtensionId = "TestExt";
-    }
-
-    fn extension() -> Arc<Extension> {
-        Extension::new_arc(
-            EXT_ID,
-            hugr_core::extension::Version::new(0, 1, 0),
-            |ext, extension_ref| {
-                ext.add_op(
-                    "Test".into(),
-                    String::new(),
-                    Signature::new(
-                        vec![qb_t(), usize_t()],
-                        TypeRow::from(vec![Type::new_sum(vec![vec![qb_t()], vec![usize_t()]])]),
-                    ),
-                    extension_ref,
-                )
-                .unwrap();
-            },
-        )
-    }
-
-    fn unary_unit_sum<B: AsMut<Hugr> + AsRef<Hugr>, T>(b: &mut DFGWrapper<B, T>) -> Wire {
-        b.add_load_value(Value::unary_unit_sum())
-    }
-
-    #[rstest]
-    #[case(true)]
-    #[case(false)]
-    fn in_loop(#[case] self_loop: bool) -> Result<(), Box<dyn std::error::Error>> {
-        /* self_loop==False:
-           -> Noop1 -----> Test -> Exit       -> Noop1AndTest --> Exit
-               |            |            =>     /            \
-               \-<- Noop2 <-/                   \-<- Noop2 <-/
-           (Noop2 -> Noop1 cannot be merged because Noop1 is the entry node)
-
-           self_loop==True:
-           -> Noop --> Test -> Exit           -> NoopAndTest --> Exit
-               |        |                =>     /           \
-               \--<--<--/                       \--<-----<--/
-        */
-
-        use hugr_core::extension::prelude::Noop;
-        let loop_variants: TypeRow = vec![qb_t()].into();
-        let exit_types: TypeRow = vec![usize_t()].into();
-        let e = extension();
-        let tst_op = e.instantiate_extension_op("Test", [])?;
-        let mut h = CFGBuilder::new(inout_sig(loop_variants.clone(), exit_types.clone()))?;
-        let mut no_b1 = h.simple_entry_builder(loop_variants.clone(), 1)?;
-        let n = no_b1.add_dataflow_op(Noop::new(qb_t()), no_b1.input_wires())?;
-        let br = unary_unit_sum(&mut no_b1);
-        let no_b1 = no_b1.finish_with_outputs(br, n.outputs())?;
-        let mut test_block = h.block_builder(
-            loop_variants.clone(),
-            vec![loop_variants.clone(), exit_types],
-            type_row![],
-        )?;
-        let [test_input] = test_block.input_wires_arr();
-        let usize_cst = test_block.add_load_value(ConstUsize::new(1));
-        let [tst] = test_block
-            .add_dataflow_op(tst_op, [test_input, usize_cst])?
-            .outputs_arr();
-        let test_block = test_block.finish_with_outputs(tst, [])?;
-        let loop_backedge_target = if self_loop {
-            no_b1
-        } else {
-            let mut no_b2 = h.simple_block_builder(endo_sig(loop_variants), 1)?;
-            let n = no_b2.add_dataflow_op(Noop::new(qb_t()), no_b2.input_wires())?;
-            let br = unary_unit_sum(&mut no_b2);
-            let nid = no_b2.finish_with_outputs(br, n.outputs())?;
-            h.branch(&nid, 0, &no_b1)?;
-            nid
-        };
-        h.branch(&no_b1, 0, &test_block)?;
-        h.branch(&test_block, 0, &loop_backedge_target)?;
-        h.branch(&test_block, 1, &h.exit_block())?;
-
-        let mut h = h.finish_hugr()?;
-        let r = h.entrypoint();
-        merge_basic_blocks(&mut h);
-        h.validate().unwrap();
-        assert_eq!(r, h.entrypoint());
-        assert!(matches!(h.get_optype(r), OpType::CFG(_)));
-        let [entry, exit] = h
-            .children(r)
-            .take(2)
-            .collect::<Vec<_>>()
-            .try_into()
-            .unwrap();
-        // Check the Noop('s) is/are in the right block(s)
-        let nops = h
-            .entry_descendants()
-            .filter(|n| h.get_optype(*n).cast::<Noop>().is_some());
-        let (entry_nop, expected_backedge_target) = if self_loop {
-            assert_eq!(h.children(r).count(), 2);
-            (nops.exactly_one().ok().unwrap(), entry)
-        } else {
-            let [_, _, no_b2] = h.children(r).collect::<Vec<_>>().try_into().unwrap();
-            let mut nops = nops.collect::<Vec<_>>();
-            let entry_nop_idx = nops
-                .iter()
-                .position(|n| h.get_parent(*n) == Some(entry))
-                .unwrap();
-            let entry_nop = nops[entry_nop_idx];
-            nops.remove(entry_nop_idx);
-            let [n_op2] = nops.try_into().unwrap();
-            assert_eq!(h.get_parent(n_op2), Some(no_b2));
-            (entry_nop, no_b2)
-        };
-        assert_eq!(h.get_parent(entry_nop), Some(entry));
-        assert_eq!(
-            h.output_neighbours(entry).collect::<HashSet<_>>(),
-            HashSet::from([expected_backedge_target, exit])
-        );
-        // And the Noop in the entry block is consumed by the custom Test op
-        let tst = find_unique(
-            h.entry_descendants(),
-            |n| matches!(h.get_optype(*n), OpType::ExtensionOp(c) if c.def().extension_id() != &PRELUDE_ID),
-        );
-        assert_eq!(h.get_parent(tst), Some(entry));
-        assert_eq!(
-            h.output_neighbours(entry_nop).collect::<Vec<_>>(),
-            vec![tst]
-        );
-        Ok(())
-    }
-
-    #[test]
-    fn triple_with_permute() -> Result<(), Box<dyn std::error::Error>> {
-        // Blocks are just BB1 -> BB2 -> BB3 --> Exit.
-        // CFG Normalization would move everything outside the CFG and elide the CFG altogether,
-        // but this is an easy-to-construct test of merge-basic-blocks only (no CFG normalization).
-        let e = extension();
-        let tst_op: OpType = e.instantiate_extension_op("Test", &[])?.into();
-        let [res_t] = tst_op
-            .dataflow_signature()
-            .unwrap()
-            .into_owned()
-            .output
-            .into_owned()
-            .try_into()
-            .unwrap();
-        let mut h = CFGBuilder::new(inout_sig(qb_t(), res_t.clone()))?;
-        let mut bb1 = h.simple_entry_builder(vec![usize_t(), qb_t()].into(), 1)?;
-        let [inw] = bb1.input_wires_arr();
-        let load_cst = bb1.add_load_value(ConstUsize::new(1));
-        let pred = unary_unit_sum(&mut bb1);
-        let bb1 = bb1.finish_with_outputs(pred, [load_cst, inw])?;
-
-        let mut bb2 = h.block_builder(
-            vec![usize_t(), qb_t()].into(),
-            vec![type_row![]],
-            vec![qb_t(), usize_t()].into(),
-        )?;
-        let [u, q] = bb2.input_wires_arr();
-        let pred = unary_unit_sum(&mut bb2);
-        let bb2 = bb2.finish_with_outputs(pred, [q, u])?;
-
-        let mut bb3 = h.block_builder(
-            vec![qb_t(), usize_t()].into(),
-            vec![type_row![]],
-            res_t.clone().into(),
-        )?;
-        let [q, u] = bb3.input_wires_arr();
-        let tst = bb3.add_dataflow_op(tst_op, [q, u])?;
-        let pred = unary_unit_sum(&mut bb3);
-        let bb3 = bb3.finish_with_outputs(pred, tst.outputs())?;
-        // Now add control-flow edges between basic blocks
-        h.branch(&bb1, 0, &bb2)?;
-        h.branch(&bb2, 0, &bb3)?;
-        h.branch(&bb3, 0, &h.exit_block())?;
-
-        let mut h = h.finish_hugr()?;
-        merge_basic_blocks(&mut h);
-        h.validate()?;
-
-        // Should only be one BB left
-        let [bb, _exit] = h
-            .children(h.entrypoint())
-            .collect::<Vec<_>>()
-            .try_into()
-            .unwrap();
-        let tst = find_unique(
-            h.entry_descendants(),
-            |n| matches!(h.get_optype(*n), OpType::ExtensionOp(c) if c.def().extension_id() != &PRELUDE_ID),
-        );
-        assert_eq!(h.get_parent(tst), Some(bb));
-
-        let inp = find_unique(h.entry_descendants(), |n| {
-            matches!(h.get_optype(*n), OpType::Input(_))
-        });
-        let mut tst_inputs = h.input_neighbours(tst).collect::<Vec<_>>();
-        tst_inputs.remove(tst_inputs.iter().find_position(|n| **n == inp).unwrap().0);
-        let [other_input] = tst_inputs.try_into().unwrap();
-        assert_eq!(
-            h.get_optype(other_input),
-            &(LoadConstant {
-                datatype: usize_t()
-            }
-            .into())
-        );
-        Ok(())
-    }
-
-    fn find_unique<T>(items: impl Iterator<Item = T>, pred: impl Fn(&T) -> bool) -> T {
-        items.filter(pred).exactly_one().ok().unwrap()
-    }
-}
diff --git a/hugr-passes/src/normalize_cfgs.rs b/hugr-passes/src/normalize_cfgs.rs
new file mode 100644
index 0000000000..7599f6928b
--- /dev/null
+++ b/hugr-passes/src/normalize_cfgs.rs
@@ -0,0 +1,994 @@
+//! CFG normalizations.
+//!
+//! * Merge BBs along control-flow edges where the source BB has no other successors
+//!   and the target BB has no other predecessors.
+//! * Move entry/last-before-exit blocks outside of CFG when possible.
+//! * Convert whole CFG to DFG if straight-line control-flow
+use std::collections::HashMap;
+
+use hugr_core::extension::prelude::UnpackTuple;
+use hugr_core::hugr::hugrmut::HugrMut;
+use hugr_core::types::{EdgeKind, Signature, TypeRow};
+use itertools::Itertools;
+
+use hugr_core::hugr::patch::inline_dfg::InlineDFG;
+use hugr_core::hugr::patch::replace::{NewEdgeKind, NewEdgeSpec, Replacement};
+use hugr_core::ops::{
+    CFG, DFG, DataflowBlock, DataflowParent, ExitBlock, Input, OpTag, OpTrait, OpType, Output,
+};
+use hugr_core::{Direction, Hugr, HugrView, Node, OutgoingPort, PortIndex};
+
+use crate::ComposablePass;
+
+/// Merge any basic blocks that are direct children of the specified [`CFG`]-entrypoint
+/// Hugr.
+///
+/// That is, where a basic block B has a single successor B' whose only predecessor
+/// is B, B and B' can be combined.
+///
+/// Returns the number of merged blocks.
+///
+/// # Errors
+///
+/// [NormalizeCFGError::NotCFG] If the entrypoint is not a CFG
+pub fn merge_basic_blocks<H: HugrMut>(cfg: &mut H) -> Result<usize, NormalizeCFGError> {
+    if !cfg.entrypoint_optype().is_cfg() {
+        return Err(NormalizeCFGError::NotCFG(cfg.entrypoint_optype().tag()));
+    }
+    let mut num_merged = 0;
+    let mut worklist = cfg.children(cfg.entrypoint()).collect::<Vec<_>>();
+    while let Some(n) = worklist.pop() {
+        // Consider merging n with its successor
+        let Ok(succ) = cfg.output_neighbours(n).exactly_one() else {
+            continue;
+        };
+        if cfg.input_neighbours(succ).count() != 1 {
+            continue;
+        }
+        if cfg.children(cfg.entrypoint()).take(2).contains(&succ) {
+            // If succ is...
+            //   - the entry block, that has an implicit extra in-edge, so cannot merge with n.
+            //   - the exit block, nodes in n should move *outside* the CFG - a separate pass.
+            continue;
+        }
+        num_merged += 1;
+        let (rep, merge_bb, dfgs) = mk_rep(cfg, n, succ);
+        let node_map = cfg.apply_patch(rep).unwrap();
+        let merged_bb = *node_map.get(&merge_bb).unwrap();
+        for dfg_id in dfgs {
+            let n_id = *node_map.get(&dfg_id).unwrap();
+            cfg.apply_patch(InlineDFG(n_id.into())).unwrap();
+        }
+        worklist.push(merged_bb);
+    }
+    Ok(num_merged)
+}
+
+/// Errors from [normalize_cfg]
+#[derive(Clone, Debug, thiserror::Error, PartialEq, Eq)]
+pub enum NormalizeCFGError {
+    /// The requested node was not a CFG
+    #[error("Requested node was not a CFG but {_0}")]
+    NotCFG(OpTag),
+}
+
+/// Result from [normalize_cfg], i.e. a report of what changes were made to the Hugr.
+///
+/// `N` is the type of the nodes in the Hugr.
+#[derive(Clone, Debug, PartialEq, Eq)]
+pub enum NormalizeCFGResult<N = Node> {
+    /// The entire [`CFG`] was converted into a [`DFG`].
+    ///
+    /// The entrypoint node id is preserved after the conversion, but now identifies
+    /// the new [`DFG`].
+    CFGToDFG,
+    /// The CFG was preserved, but the entry or exit blocks may have changed.
+    CFGPreserved {
+        /// If `Some`, the new [DFG] containing what was previously in the entry block
+        entry_dfg: Option<N>,
+        /// If `Some`, the new [DFG] of what was previously in the last block before the exit
+        exit_dfg: Option<N>,
+        /// The number of basic blocks merged together.
+        /// Does not include any lifted to become DFGs outside.
+        num_merged: usize,
+    },
+}
+
+/// A [ComposablePass] that normalizes CFGs (i.e. [normalize_cfg]) in a Hugr.
+#[derive(Clone, Debug)]
+pub struct NormalizeCFGPass<N> {
+    cfgs: Vec<N>,
+}
+
+impl<N> Default for NormalizeCFGPass<N> {
+    fn default() -> Self {
+        Self { cfgs: vec![] }
+    }
+}
+
+impl<N> NormalizeCFGPass<N> {
+    /// Allows mutating the set of CFG nodes that will be normalized.
+    ///
+    /// If empty (the default), all (non-strict) descendants of the [HugrView::entrypoint]
+    /// will be normalized.
+    pub fn cfgs(&mut self) -> &mut Vec<N> {
+        &mut self.cfgs
+    }
+}
+
+impl<H: HugrMut> ComposablePass<H> for NormalizeCFGPass<H::Node> {
+    type Error = NormalizeCFGError;
+
+    /// For each CFG node that was normalized, the [NormalizeCFGResult] for that CFG
+    type Result = HashMap<H::Node, NormalizeCFGResult<H::Node>>;
+
+    fn run(&self, hugr: &mut H) -> Result<Self::Result, Self::Error> {
+        let cfgs = if self.cfgs.is_empty() {
+            let mut v = hugr
+                .entry_descendants()
+                .filter(|n| hugr.get_optype(*n).is_cfg())
+                .collect::<Vec<_>>();
+            // Process inner CFGs first, in case they are removed (if they are in a completely
+            // disconnected block when the Entry node has only the Exit as successor).
+            v.reverse();
+            v
+        } else {
+            self.cfgs.clone()
+        };
+        let mut results = HashMap::new();
+        for cfg in cfgs {
+            let res = normalize_cfg(&mut hugr.with_entrypoint_mut(cfg))?;
+            results.insert(cfg, res);
+        }
+        Ok(results)
+    }
+}
+
+/// Normalize a CFG in a Hugr:
+/// * Merge consecutive basic blocks i.e. where a BB has only a single successor which
+///   has no predecessors
+/// * If the entry block has only one successor, and no predecessors, then move its contents
+///   into a DFG outside/before CFG.
+///    * If that successor is the exit block, then convert the entire CFG to a DFG.
+///      This will be reported via [NormalizeCFGResult::CFGToDFG]
+/// * (Similarly) if the exit block has only one predecessor, then move contents into a DFG
+///   outside/after CFG.
+///
+/// # Errors
+///
+/// [NormalizeCFGError::NotCFG] If the entrypoint is not a CFG
+pub fn normalize_cfg<H: HugrMut>(
+    h: &mut H,
+) -> Result<NormalizeCFGResult<H::Node>, NormalizeCFGError> {
+    let num_merged = merge_basic_blocks(h)?;
+    let cfg_node = h.entrypoint();
+    fn cfg_ty_mut<H: HugrMut>(h: &mut H, n: H::Node) -> &mut CFG {
+        match h.optype_mut(n) {
+            OpType::CFG(cfg) => cfg,
+            _ => unreachable!(), // Checked at entry to normalize_cfg
+        }
+    }
+    // Further normalizations with effects outside the CFG
+    let [entry, exit] = h.children(cfg_node).take(2).collect_array().unwrap();
+    let entry_blk = h.get_optype(entry).as_dataflow_block().unwrap();
+    let cfg_parent = h.get_parent(cfg_node).unwrap();
+    // 1. If the entry block has no predecessors, then we can move contents outside/before the CFG.
+    // However, we only do this if the Entry block has just one successor (i.e. we can remove
+    // the entry block altogether) - an extension would be to do this in other cases, preserving
+    // the Entry block as an empty branch.
+    let mut entry_dfg = None;
+    if let Some(succ) = h
+        .output_neighbours(entry)
+        .exactly_one()
+        .ok()
+        .filter(|_| h.input_neighbours(entry).next().is_none())
+    {
+        if succ == exit {
+            // 1a. Turn the CFG into a DFG containing only what was in the entry block
+            assert_eq!(
+                &Signature::new(
+                    entry_blk.inputs.clone(),
+                    entry_blk.successor_input(0).unwrap()
+                ),
+                h.signature(cfg_node).unwrap().as_ref()
+            );
+            // Annoying here - "while let Some(blk) = cfg.children(...).skip(1).next()" keeps iterator alive
+            let children_to_remove: Vec<_> = h.children(cfg_node).skip(1).collect();
+            for blk in children_to_remove {
+                h.remove_subtree(blk);
+            }
+            while let Some(ch) = h.first_child(entry) {
+                h.set_parent(ch, cfg_node);
+            }
+            h.remove_node(entry);
+            let signature = std::mem::take(&mut cfg_ty_mut(h, cfg_node).signature);
+            let result_tys = signature.output.clone();
+            h.replace_op(cfg_node, OpType::DFG(DFG { signature }));
+            unpack_before_output(h, h.get_io(cfg_node).unwrap()[1], result_tys);
+            return Ok(NormalizeCFGResult::CFGToDFG);
+        }
+        // 1b. Move entry block outside/before the CFG into a DFG; its successor becomes the entry block.
+        let new_cfg_inputs = entry_blk.successor_input(0).unwrap();
+        let dfg = h.add_node_with_parent(
+            cfg_parent,
+            DFG {
+                signature: Signature::new(entry_blk.inputs.clone(), new_cfg_inputs.clone()),
+            },
+        );
+        let [_, entry_output] = h.get_io(entry).unwrap();
+        while let Some(n) = h.first_child(entry) {
+            h.set_parent(n, dfg);
+        }
+        h.move_before_sibling(succ, entry);
+        h.remove_node(entry);
+
+        unpack_before_output(h, entry_output, new_cfg_inputs.clone());
+
+        // Inputs to CFG go directly to DFG
+        for inp in h.node_inputs(cfg_node).collect::<Vec<_>>() {
+            for src in h.linked_outputs(cfg_node, inp).collect::<Vec<_>>() {
+                h.connect(src.0, src.1, dfg, inp.index());
+            }
+            h.disconnect(cfg_node, inp);
+        }
+
+        // Update input ports
+        let cfg_ty = cfg_ty_mut(h, cfg_node);
+        let inputs_to_add = new_cfg_inputs.len() as isize - cfg_ty.signature.input.len() as isize;
+        cfg_ty.signature.input = new_cfg_inputs;
+        h.add_ports(cfg_node, Direction::Incoming, inputs_to_add);
+
+        // Wire outputs of DFG directly to CFG
+        for src in h.node_outputs(dfg).collect::<Vec<_>>() {
+            h.connect(dfg, src, cfg_node, src.index());
+        }
+        entry_dfg = Some(dfg);
+    }
+    // 2. If the exit node has a single predecessor and that predecessor has no other successors...
+    let mut exit_dfg = None;
+    if let Some(pred) = h
+        .input_neighbours(exit)
+        .exactly_one()
+        .ok()
+        .filter(|pred| h.output_neighbours(*pred).count() == 1)
+    {
+        // Code in that predecessor can be moved outside (into a new DFG after the CFG),
+        // and the predecessor deleted
+        let [_, output] = h.get_io(pred).unwrap();
+        let pred_blk = h.get_optype(pred).as_dataflow_block().unwrap();
+        let new_cfg_outs = pred_blk.inner_signature().into_owned().input;
+
+        // new CFG result type and exit block
+        let cfg_ty = cfg_ty_mut(h, cfg_node);
+        let result_tys = std::mem::replace(&mut cfg_ty.signature.output, new_cfg_outs.clone());
+        h.add_ports(
+            cfg_node,
+            Direction::Outgoing,
+            new_cfg_outs.len() as isize - result_tys.len() as isize,
+        );
+
+        *h.optype_mut(pred) = ExitBlock {
+            cfg_outputs: new_cfg_outs.clone(),
+        }
+        .into();
+        debug_assert_eq!(h.num_ports(pred, Direction::Outgoing), 1);
+        h.set_num_ports(pred, 1, 0);
+
+        h.move_before_sibling(pred, exit);
+        h.remove_node(exit);
+        // Move contents into new DFG
+        let dfg = h.add_node_with_parent(
+            cfg_parent,
+            DFG {
+                signature: Signature::new(new_cfg_outs, result_tys.clone()),
+            },
+        );
+        while let Some(n) = h.first_child(pred) {
+            h.set_parent(n, dfg);
+        }
+        unpack_before_output(h, output, result_tys);
+
+        // Move output edges.
+        for p in h.node_outputs(cfg_node).collect_vec() {
+            let tgts = h.linked_inputs(cfg_node, p).collect_vec();
+            h.disconnect(cfg_node, p);
+            for tgt in tgts {
+                h.connect(dfg, p, tgt.0, tgt.1)
+            }
+        }
+        for p in h.node_inputs(dfg).collect_vec() {
+            h.connect(cfg_node, p.index(), dfg, p);
+        }
+        exit_dfg = Some(dfg);
+    }
+    Ok(NormalizeCFGResult::CFGPreserved {
+        entry_dfg,
+        exit_dfg,
+        num_merged,
+    })
+}
+
+fn mk_rep<H: HugrView>(
+    cfg: &H,
+    pred: H::Node,
+    succ: H::Node,
+) -> (Replacement<H::Node>, Node, [Node; 2]) {
+    let pred_ty = cfg.get_optype(pred).as_dataflow_block().unwrap();
+    let succ_ty = cfg.get_optype(succ).as_dataflow_block().unwrap();
+    let succ_sig = succ_ty.inner_signature();
+
+    // Make a Hugr with just a single CFG root node having the same signature.
+    let mut replacement: Hugr = Hugr::new_with_entrypoint(cfg.entrypoint_optype().clone())
+        .expect("Replacement should have a CFG entrypoint");
+
+    let merged = replacement.add_node_with_parent(replacement.entrypoint(), {
+        DataflowBlock {
+            inputs: pred_ty.inputs.clone(),
+            ..succ_ty.clone()
+        }
+    });
+    let input = replacement.add_node_with_parent(
+        merged,
+        Input {
+            types: pred_ty.inputs.clone(),
+        },
+    );
+    let output = replacement.add_node_with_parent(
+        merged,
+        Output {
+            types: succ_sig.output.clone(),
+        },
+    );
+
+    let dfg1 = replacement.add_node_with_parent(
+        merged,
+        DFG {
+            signature: pred_ty.inner_signature().into_owned(),
+        },
+    );
+    for (i, _) in pred_ty.inputs.iter().enumerate() {
+        replacement.connect(input, i, dfg1, i);
+    }
+
+    let dfg2 = replacement.add_node_with_parent(
+        merged,
+        DFG {
+            signature: succ_sig.as_ref().clone(),
+        },
+    );
+    for (i, _) in succ_sig.output.iter().enumerate() {
+        replacement.connect(dfg2, i, output, i);
+    }
+
+    // At the junction, must unpack the first (tuple, branch predicate) output
+    let dfg1_outs = replacement
+        .out_value_types(dfg1)
+        .enumerate()
+        .map(|(i, _)| (dfg1, i.into()))
+        .collect::<Vec<_>>();
+
+    let dfg_order_out = replacement.get_optype(dfg1).other_output_port().unwrap();
+    let order_srcs = (dfg1_outs.is_empty()).then_some((dfg1, dfg_order_out));
+    // Do not add Order edges between DFGs unless there are no value edges
+    wire_unpack_first(&mut replacement, dfg1_outs, order_srcs, dfg2);
+
+    // If there are edges from succ back to pred, we cannot do these via the mu_inp/out/new
+    // edge-maps as both source and target of the new edge are in the replacement Hugr
+    for (_, src_pos) in cfg.all_linked_outputs(pred).filter(|(src, _)| *src == succ) {
+        replacement.connect(merged, src_pos, merged, 0);
+    }
+    let rep = Replacement {
+        removal: vec![pred, succ],
+        replacement,
+        adoptions: HashMap::from([(dfg1, pred), (dfg2, succ)]),
+        mu_inp: cfg
+            .all_linked_outputs(pred)
+            .filter(|(src, _)| *src != succ)
+            .map(|(src, src_pos)| NewEdgeSpec {
+                src,
+                tgt: merged,
+                kind: NewEdgeKind::ControlFlow { src_pos },
+            })
+            .collect(),
+        mu_out: cfg
+            .node_outputs(succ)
+            .filter_map(|src_pos| {
+                let tgt = cfg
+                    .linked_inputs(succ, src_pos)
+                    .exactly_one()
+                    .ok()
+                    .unwrap()
+                    .0;
+                if tgt == pred {
+                    None
+                } else {
+                    Some(NewEdgeSpec {
+                        src: merged,
+                        tgt,
+                        kind: NewEdgeKind::ControlFlow { src_pos },
+                    })
+                }
+            })
+            .collect(),
+        mu_new: vec![],
+    };
+    (rep, merged, [dfg1, dfg2])
+}
+
+type NodePorts<N> = Vec<(N, OutgoingPort)>;
+/// Remove all input wires to `n` and return them in two groups:
+/// the [EdgeKind::Value] inputs, and the [EdgeKind::StateOrder] inputs
+fn take_inputs<H: HugrMut>(h: &mut H, n: H::Node) -> (NodePorts<H::Node>, NodePorts<H::Node>) {
+    let mut values = vec![];
+    let mut orders = vec![];
+    for p in h.node_inputs(n).collect_vec() {
+        let srcs = h.linked_outputs(n, p).collect_vec();
+        h.disconnect(n, p);
+        match h.get_optype(n).port_kind(p) {
+            Some(EdgeKind::Value(_)) => {
+                assert_eq!(srcs.len(), 1);
+                values.extend(srcs);
+            }
+            Some(EdgeKind::StateOrder) => {
+                assert_eq!(orders, []);
+                orders.extend(srcs);
+            }
+            k => panic!("Unexpected port kind: {:?}", k),
+        }
+    }
+    (values, orders)
+}
+
+fn tuple_elems<H: HugrView>(h: &H, n: H::Node, p: OutgoingPort) -> TypeRow {
+    match h.get_optype(n).port_kind(p) {
+        Some(EdgeKind::Value(ty)) => ty.as_sum().unwrap().as_tuple().unwrap().clone(),
+        p => panic!("Expected Value port not {:?}", p),
+    }
+    .try_into()
+    .unwrap()
+}
+
+/// Unpack the first `value_srcs`; wire the unpacked elements and remaining `value_srcs` into
+/// consecutive ports of `dst`. Finally wire `order_srcs` all to the order input of `dst`.
+fn wire_unpack_first<H: HugrMut>(
+    h: &mut H,
+    value_srcs: impl IntoIterator<Item = (H::Node, OutgoingPort)>,
+    order_srcs: impl IntoIterator<Item = (H::Node, OutgoingPort)>,
+    dst: H::Node,
+) {
+    let parent = h.get_parent(dst).unwrap();
+    let mut srcs = value_srcs.into_iter();
+    let src_to_unpack = srcs.next().unwrap();
+    let tuple_tys = tuple_elems(h, src_to_unpack.0, src_to_unpack.1);
+    let tuple_len = tuple_tys.len();
+    let unp = h.add_node_with_parent(parent, UnpackTuple::new(tuple_tys));
+    h.connect(src_to_unpack.0, src_to_unpack.1, unp, 0);
+
+    for i in 0..tuple_len {
+        h.connect(unp, i, dst, i);
+    }
+    assert_eq!(
+        h.get_optype(dst).other_port_kind(Direction::Incoming),
+        Some(EdgeKind::StateOrder)
+    );
+    let order_tgt = h.get_optype(dst).other_input_port().unwrap();
+    for (i, (src, src_p)) in srcs.enumerate() {
+        assert!(i + tuple_len < order_tgt.index());
+        h.connect(src, src_p, dst, i + tuple_len);
+    }
+    for (src, src_p) in order_srcs {
+        h.connect(src, src_p, dst, order_tgt);
+    }
+}
+
+/// Unpack the first input to specified [Output] node and shuffle all the rest along
+fn unpack_before_output<H: HugrMut>(h: &mut H, output_node: H::Node, new_types: TypeRow) {
+    let (values, orders) = take_inputs(h, output_node);
+    let OpType::Output(ou) = h.optype_mut(output_node) else {
+        panic!()
+    };
+    let ports_to_add = new_types.len() as isize - ou.types.len() as isize;
+    ou.types = new_types;
+    h.add_ports(output_node, Direction::Incoming, ports_to_add);
+    wire_unpack_first(h, values, orders, output_node);
+}
+
+#[cfg(test)]
+mod test {
+    use std::collections::HashSet;
+    use std::sync::Arc;
+
+    use hugr_core::extension::simple_op::MakeExtensionOp;
+    use itertools::Itertools;
+    use rstest::rstest;
+
+    use hugr_core::builder::{
+        CFGBuilder, Dataflow, HugrBuilder, SubContainer, endo_sig, inout_sig,
+    };
+    use hugr_core::extension::prelude::{ConstUsize, Noop, PRELUDE_ID, UnpackTuple, qb_t, usize_t};
+    use hugr_core::ops::{LoadConstant, OpTag, OpTrait, OpType, Tag};
+    use hugr_core::ops::{constant::Value, handle::NodeHandle};
+    use hugr_core::types::{Signature, Type, TypeRow};
+    use hugr_core::{Extension, HugrView, const_extension_ids, type_row};
+
+    use super::{NormalizeCFGPass, NormalizeCFGResult, merge_basic_blocks, normalize_cfg};
+    use crate::ComposablePass;
+
+    const_extension_ids! {
+        const EXT_ID: ExtensionId = "TestExt";
+    }
+
+    fn extension() -> Arc<Extension> {
+        Extension::new_arc(
+            EXT_ID,
+            hugr_core::extension::Version::new(0, 1, 0),
+            |ext, extension_ref| {
+                ext.add_op(
+                    "Test".into(),
+                    String::new(),
+                    Signature::new(
+                        vec![qb_t(), usize_t()],
+                        TypeRow::from(vec![Type::new_sum(vec![vec![qb_t()], vec![usize_t()]])]),
+                    ),
+                    extension_ref,
+                )
+                .unwrap();
+            },
+        )
+    }
+
+    #[rstest]
+    #[case(true)]
+    #[case(false)]
+    fn merge_bbs_in_loop(#[case] self_loop: bool) -> Result<(), Box<dyn std::error::Error>> {
+        /* self_loop==False:
+           -> Noop1 -----> Test -> Exit       -> Noop1AndTest --> Exit
+               |            |            =>     /            \
+               \-<- Noop2 <-/                   \-<- Noop2 <-/
+           (Noop2 -> Noop1 cannot be merged because Noop1 is the entry node)
+
+           self_loop==True:
+           -> Noop --> Test -> Exit           -> NoopAndTest --> Exit
+               |        |                =>     /           \
+               \--<--<--/                       \--<-----<--/
+        */
+
+        let loop_variants: TypeRow = vec![qb_t()].into();
+        let exit_types: TypeRow = vec![usize_t()].into();
+        let e = extension();
+        let tst_op = e.instantiate_extension_op("Test", [])?;
+        let mut h = CFGBuilder::new(inout_sig(loop_variants.clone(), exit_types.clone()))?;
+        let mut no_b1 = h.simple_entry_builder(loop_variants.clone(), 1)?;
+        let n = no_b1.add_dataflow_op(Noop::new(qb_t()), no_b1.input_wires())?;
+        let br = no_b1.add_load_value(Value::unary_unit_sum());
+        let no_b1 = no_b1.finish_with_outputs(br, n.outputs())?;
+        let mut test_block = h.block_builder(
+            loop_variants.clone(),
+            vec![loop_variants.clone(), exit_types],
+            type_row![],
+        )?;
+        let [test_input] = test_block.input_wires_arr();
+        let usize_cst = test_block.add_load_value(ConstUsize::new(1));
+        let [tst] = test_block
+            .add_dataflow_op(tst_op, [test_input, usize_cst])?
+            .outputs_arr();
+        let test_block = test_block.finish_with_outputs(tst, [])?;
+        let loop_backedge_target = if self_loop {
+            no_b1
+        } else {
+            let mut no_b2 = h.simple_block_builder(endo_sig(loop_variants), 1)?;
+            let n = no_b2.add_dataflow_op(Noop::new(qb_t()), no_b2.input_wires())?;
+            let br = no_b2.add_load_value(Value::unary_unit_sum());
+            let nid = no_b2.finish_with_outputs(br, n.outputs())?;
+            h.branch(&nid, 0, &no_b1)?;
+            nid
+        };
+        h.branch(&no_b1, 0, &test_block)?;
+        h.branch(&test_block, 0, &loop_backedge_target)?;
+        h.branch(&test_block, 1, &h.exit_block())?;
+
+        let mut h = h.finish_hugr()?;
+        let r = h.entrypoint();
+        let num_merged = merge_basic_blocks(&mut h)?;
+        assert_eq!(num_merged, 1);
+        h.validate().unwrap();
+        assert_eq!(r, h.entrypoint());
+        assert!(matches!(h.get_optype(r), OpType::CFG(_)));
+        let [entry, exit] = h
+            .children(r)
+            .take(2)
+            .collect::<Vec<_>>()
+            .try_into()
+            .unwrap();
+        // Check the Noop('s) is/are in the right block(s)
+        let nops = h
+            .entry_descendants()
+            .filter(|n| h.get_optype(*n).cast::<Noop>().is_some());
+        let (entry_nop, expected_backedge_target) = if self_loop {
+            assert_eq!(h.children(r).count(), 2);
+            (nops.exactly_one().ok().unwrap(), entry)
+        } else {
+            let [_, _, no_b2] = h.children(r).collect::<Vec<_>>().try_into().unwrap();
+            let mut nops = nops.collect::<Vec<_>>();
+            let entry_nop_idx = nops
+                .iter()
+                .position(|n| h.get_parent(*n) == Some(entry))
+                .unwrap();
+            let entry_nop = nops[entry_nop_idx];
+            nops.remove(entry_nop_idx);
+            let [n_op2] = nops.try_into().unwrap();
+            assert_eq!(h.get_parent(n_op2), Some(no_b2));
+            (entry_nop, no_b2)
+        };
+        assert_eq!(h.get_parent(entry_nop), Some(entry));
+        assert_eq!(
+            h.output_neighbours(entry).collect::<HashSet<_>>(),
+            HashSet::from([expected_backedge_target, exit])
+        );
+        // And the Noop in the entry block is consumed by the custom Test op
+        let tst = find_unique(
+            h.entry_descendants(),
+            |n| matches!(h.get_optype(*n), OpType::ExtensionOp(c) if c.def().extension_id() != &PRELUDE_ID),
+        );
+        assert_eq!(h.get_parent(tst), Some(entry));
+        assert_eq!(
+            h.output_neighbours(entry_nop).collect::<Vec<_>>(),
+            vec![tst]
+        );
+        Ok(())
+    }
+
+    #[test]
+    fn elide_triple_with_permute() -> Result<(), Box<dyn std::error::Error>> {
+        // Blocks are just BB1 -> BB2 -> BB3 --> Exit.
+        // Should be merged into one BB (we don't check that specifically)
+        // and then the whole CFG elided.
+        let e = extension();
+        let tst_op: OpType = e.instantiate_extension_op("Test", &[])?.into();
+        let [res_t] = tst_op
+            .dataflow_signature()
+            .unwrap()
+            .into_owned()
+            .output
+            .into_owned()
+            .try_into()
+            .unwrap();
+        let mut h = CFGBuilder::new(inout_sig(qb_t(), res_t.clone()))?;
+        let mut bb1 = h.simple_entry_builder(vec![usize_t(), qb_t()].into(), 1)?;
+        let [inw] = bb1.input_wires_arr();
+        let load_cst = bb1.add_load_value(ConstUsize::new(1));
+        let pred = bb1.add_load_value(Value::unary_unit_sum());
+        let bb1 = bb1.finish_with_outputs(pred, [load_cst, inw])?;
+
+        let mut bb2 = h.block_builder(
+            vec![usize_t(), qb_t()].into(),
+            vec![type_row![]],
+            vec![qb_t(), usize_t()].into(),
+        )?;
+        let [u, q] = bb2.input_wires_arr();
+        let pred = bb2.add_load_value(Value::unary_unit_sum());
+        let bb2 = bb2.finish_with_outputs(pred, [q, u])?;
+
+        let mut bb3 = h.block_builder(
+            vec![qb_t(), usize_t()].into(),
+            vec![type_row![]],
+            res_t.clone().into(),
+        )?;
+        let [q, u] = bb3.input_wires_arr();
+        let tst = bb3.add_dataflow_op(tst_op, [q, u])?;
+        let pred = bb3.add_load_value(Value::unary_unit_sum());
+        let bb3 = bb3.finish_with_outputs(pred, tst.outputs())?;
+        // Now add control-flow edges between basic blocks
+        h.branch(&bb1, 0, &bb2)?;
+        h.branch(&bb2, 0, &bb3)?;
+        h.branch(&bb3, 0, &h.exit_block())?;
+
+        let mut h = h.finish_hugr()?;
+        let res = normalize_cfg(&mut h);
+        assert_eq!(res, Ok(NormalizeCFGResult::CFGToDFG));
+        h.validate()?;
+        assert_eq!(h.entrypoint_optype().tag(), OpTag::Dfg);
+        assert_eq!(
+            h.entry_descendants().find(|n| matches!(
+                h.get_optype(*n),
+                OpType::DataflowBlock(_) | OpType::CFG(_) | OpType::ExitBlock(_)
+            )),
+            None
+        );
+        let tst = find_unique(
+            h.entry_descendants(),
+            |n| matches!(h.get_optype(*n), OpType::ExtensionOp(c) if c.def().extension_id() != &PRELUDE_ID),
+        );
+        assert_eq!(h.get_parent(tst), Some(h.entrypoint()));
+
+        let inp = find_unique(h.entry_descendants(), |n| {
+            matches!(h.get_optype(*n), OpType::Input(_))
+        });
+        let mut tst_inputs = h.input_neighbours(tst).collect::<Vec<_>>();
+        tst_inputs.remove(tst_inputs.iter().find_position(|n| **n == inp).unwrap().0);
+        let [other_input] = tst_inputs.try_into().unwrap();
+        assert_eq!(
+            h.get_optype(other_input),
+            &(LoadConstant {
+                datatype: usize_t()
+            }
+            .into())
+        );
+        Ok(())
+    }
+
+    fn find_unique<T>(items: impl Iterator<Item = T>, pred: impl Fn(&T) -> bool) -> T {
+        items.filter(pred).exactly_one().ok().unwrap()
+    }
+
+    #[test]
+    fn entry_before_loop() -> Result<(), Box<dyn std::error::Error>> {
+        /* -> Noop --> Test -> Exit      -> Test --> Exit
+                       |  |          =>     |  |
+                       \<-/                 \<-/
+        */
+        let loop_variants: TypeRow = vec![qb_t()].into();
+        let exit_types: TypeRow = vec![usize_t()].into();
+        let e = extension();
+        let tst_op = e.instantiate_extension_op("Test", [])?;
+        let mut h = CFGBuilder::new(inout_sig(qb_t(), usize_t()))?;
+        let mut nop_b = h.simple_entry_builder(loop_variants.clone(), 1)?;
+        let n = nop_b.add_dataflow_op(Noop::new(qb_t()), nop_b.input_wires())?;
+        let br = nop_b.add_load_value(Value::unary_unit_sum());
+        let entry = nop_b.finish_with_outputs(br, n.outputs())?;
+
+        let mut loop_b = h.block_builder(
+            loop_variants.clone(),
+            [loop_variants, exit_types],
+            type_row![],
+        )?;
+        let [qb] = loop_b.input_wires_arr();
+        let usz = loop_b.add_load_value(ConstUsize::new(3));
+        let [tst] = loop_b.add_dataflow_op(tst_op, [qb, usz])?.outputs_arr();
+        let loop_ = loop_b.finish_with_outputs(tst, [])?;
+        h.branch(&entry, 0, &loop_)?;
+        h.branch(&loop_, 0, &loop_)?;
+        h.branch(&loop_, 1, &h.exit_block())?;
+
+        let mut h = h.finish_hugr()?;
+
+        let res = normalize_cfg(&mut h).unwrap();
+        h.validate().unwrap();
+        let NormalizeCFGResult::CFGPreserved {
+            entry_dfg: Some(dfg),
+            exit_dfg: None,
+            num_merged: 0,
+        } = res
+        else {
+            panic!("Unexpected result");
+        };
+        assert_eq!(
+            h.children(h.entrypoint())
+                .map(|n| h.get_optype(n).tag())
+                .collect_vec(),
+            [OpTag::DataflowBlock, OpTag::BasicBlockExit]
+        );
+        let func = h.get_parent(h.entrypoint()).unwrap();
+        let func_children = child_tags_ext_ids(&h, func);
+        assert_eq!(
+            func_children.into_iter().sorted().collect_vec(),
+            ["Cfg", "Dfg", "Input", "Output",]
+        );
+        assert_eq!(
+            h.children(func)
+                .filter(|n| h.get_optype(*n).is_dfg())
+                .collect_vec(),
+            [dfg]
+        );
+        assert_eq!(
+            child_tags_ext_ids(&h, dfg)
+                .into_iter()
+                .sorted()
+                .collect_vec(),
+            [
+                "Const",
+                "Input",
+                "LoadConst",
+                "Noop",
+                "Output",
+                "UnpackTuple"
+            ]
+        );
+        Ok(())
+    }
+
+    #[test]
+    fn loop_before_exit() -> Result<(), Box<dyn std::error::Error>> {
+        /* -> Test -> Noop -> Exit      -> Test --> Exit (then Noop)
+              |  |                  =>    |  |
+              \<-/                        \<-/
+        */
+        let loop_variants: TypeRow = vec![qb_t()].into();
+        let exit_types: TypeRow = vec![usize_t()].into();
+        let e = extension();
+        let tst_op = e.instantiate_extension_op("Test", [])?;
+        let mut h = CFGBuilder::new(inout_sig(loop_variants.clone(), exit_types.clone()))?;
+
+        let mut loop_b = h.entry_builder(vec![loop_variants, exit_types.clone()], type_row![])?;
+        let [qb] = loop_b.input_wires_arr();
+        let usz = loop_b.add_load_value(ConstUsize::new(3));
+        let [tst] = loop_b.add_dataflow_op(tst_op, [qb, usz])?.outputs_arr();
+        let loop_ = loop_b.finish_with_outputs(tst, [])?;
+        h.branch(&loop_, 0, &loop_)?;
+
+        let mut nop_b = h.simple_block_builder(endo_sig(exit_types), 1)?;
+        let n = nop_b.add_dataflow_op(Noop::new(usize_t()), nop_b.input_wires())?;
+        let br = nop_b.add_load_value(Value::unary_unit_sum());
+        let tail = nop_b.finish_with_outputs(br, n.outputs())?;
+
+        h.branch(&loop_, 1, &tail)?;
+        h.branch(&tail, 0, &h.exit_block())?;
+
+        let mut h = h.finish_hugr()?;
+        let res = normalize_cfg(&mut h).unwrap();
+        h.validate().unwrap();
+        let NormalizeCFGResult::CFGPreserved {
+            entry_dfg: None,
+            exit_dfg: Some(dfg),
+            num_merged: 0,
+        } = res
+        else {
+            panic!("Unexpected result");
+        };
+        assert_eq!(
+            h.children(h.entrypoint())
+                .map(|n| h.get_optype(n).tag())
+                .collect_vec(),
+            [OpTag::DataflowBlock, OpTag::BasicBlockExit]
+        );
+        let func = h.get_parent(h.entrypoint()).unwrap();
+        assert_eq!(
+            child_tags_ext_ids(&h, func),
+            ["Input", "Output", "Cfg", "Dfg"]
+        );
+
+        assert_eq!(h.children(func).last(), Some(dfg));
+        assert_eq!(
+            child_tags_ext_ids(&h, dfg)
+                .into_iter()
+                .sorted()
+                .collect_vec(),
+            [
+                "Const",
+                "Input",
+                "LoadConst",
+                "Noop",
+                "Output",
+                "UnpackTuple"
+            ]
+        );
+
+        Ok(())
+    }
+
+    #[test]
+    fn nested_cfgs_pass() {
+        //  --> Entry --> Loop --> Tail --> EXIT
+        //        |       /  \
+        //      (E->X)    \<-/
+        let e = extension();
+        let tst_op = e.instantiate_extension_op("Test", []).unwrap();
+        let qqu = vec![qb_t(), qb_t(), usize_t()];
+        let qq = TypeRow::from(vec![qb_t(); 2]);
+        let mut outer = CFGBuilder::new(inout_sig(qqu.clone(), vec![usize_t(), qb_t()])).unwrap();
+        let mut entry = outer.entry_builder(vec![qq.clone()], type_row![]).unwrap();
+        let [q1, q2, u] = entry.input_wires_arr();
+        let (inner, inner_pred) = {
+            let mut inner = entry
+                .cfg_builder([(qb_t(), q1), (qb_t(), q2)], qq.clone())
+                .unwrap();
+            let mut entry = inner.entry_builder(vec![qq.clone()], type_row![]).unwrap();
+            let [q1, q2] = entry.input_wires_arr();
+            let [pred] = entry
+                .add_dataflow_op(Tag::new(0, vec![qq.clone()]), [q1, q2])
+                .unwrap()
+                .outputs_arr();
+            let entry = entry.finish_with_outputs(pred, []).unwrap();
+            inner.branch(&entry, 0, &inner.exit_block()).unwrap();
+            (inner.finish_sub_container().unwrap(), pred.node())
+        };
+        let [q1, q2] = inner.outputs_arr();
+        let [entry_pred] = entry
+            .add_dataflow_op(Tag::new(0, vec![qq.clone()]), [q1, q2])
+            .unwrap()
+            .outputs_arr();
+        let entry = entry.finish_with_outputs(entry_pred, []).unwrap();
+
+        let loop_b = {
+            let mut loop_b = outer
+                .block_builder(qq.clone(), [qb_t().into(), usize_t().into()], qb_t().into())
+                .unwrap();
+            let [q1, q2] = loop_b.input_wires_arr();
+            // u here is `dom` edge from entry block
+            let [pred] = loop_b
+                .add_dataflow_op(tst_op, [q1, u])
+                .unwrap()
+                .outputs_arr();
+            loop_b.finish_with_outputs(pred, [q2]).unwrap()
+        };
+        outer.branch(&entry, 0, &loop_b).unwrap();
+        outer.branch(&loop_b, 0, &loop_b).unwrap();
+
+        let (tail_b, tail_pred) = {
+            let uq = TypeRow::from(vec![usize_t(), qb_t()]);
+            let mut tail_b = outer
+                .block_builder(uq.clone(), vec![uq.clone()], type_row![])
+                .unwrap();
+            let [u, q] = tail_b.input_wires_arr();
+            let [br] = tail_b
+                .add_dataflow_op(Tag::new(0, vec![uq.clone()]), [u, q])
+                .unwrap()
+                .outputs_arr();
+            (tail_b.finish_with_outputs(br, []).unwrap(), br.node())
+        };
+        outer.branch(&loop_b, 1, &tail_b).unwrap();
+        outer.branch(&tail_b, 0, &outer.exit_block()).unwrap();
+        let mut h = outer.finish_hugr().unwrap();
+        assert_eq!(
+            h.get_parent(h.get_parent(inner_pred).unwrap()),
+            Some(inner.node())
+        );
+        assert_eq!(h.get_parent(entry_pred.node()), Some(entry.node()));
+        assert_eq!(h.get_parent(tail_pred.node()), Some(tail_b.node()));
+
+        let mut res = NormalizeCFGPass::default().run(&mut h).unwrap();
+        h.validate().unwrap();
+        assert_eq!(
+            res.remove(&inner.node()),
+            Some(NormalizeCFGResult::CFGToDFG)
+        );
+        let Some(NormalizeCFGResult::CFGPreserved {
+            entry_dfg: Some(entry_dfg),
+            exit_dfg: Some(tail_dfg),
+            num_merged: 0,
+        }) = res.remove(&h.entrypoint())
+        else {
+            panic!("Unexpected result")
+        };
+        assert!(res.is_empty());
+        // Now contains only one CFG with one BB (self-loop)
+        assert_eq!(
+            h.nodes()
+                .filter(|n| h.get_optype(*n).is_cfg())
+                .exactly_one()
+                .ok(),
+            Some(h.entrypoint())
+        );
+        let [entry, exit] = h.children(h.entrypoint()).collect_array().unwrap();
+        assert_eq!(h.output_neighbours(entry).collect_vec(), [entry, exit]);
+        // Inner CFG is now a DFG (and still sibling of entry_pred)...
+        assert_eq!(h.get_parent(inner_pred), Some(inner.node()));
+        assert_eq!(h.get_optype(inner.node()).tag(), OpTag::Dfg);
+        assert_eq!(h.get_parent(inner.node()), h.get_parent(entry_pred.node()));
+        // Predicates lifted appropriately...
+        for (n, parent) in [(entry_pred.node(), entry_dfg), (tail_pred.node(), tail_dfg)] {
+            assert_eq!(h.get_parent(n), Some(parent));
+            assert_eq!(h.get_optype(parent).tag(), OpTag::Dfg);
+            assert_eq!(h.get_parent(parent), h.get_parent(h.entrypoint()));
+        }
+        // ...and followed by UnpackTuple's
+        for n in [inner_pred, entry_pred.node(), tail_pred.node()] {
+            let [unpack] = h.output_neighbours(n).collect_array().unwrap();
+            assert!(
+                h.get_optype(unpack)
+                    .as_extension_op()
+                    .and_then(|e| UnpackTuple::from_extension_op(e).ok())
+                    .is_some()
+            );
+        }
+    }
+
+    fn child_tags_ext_ids<H: HugrView>(h: &H, n: H::Node) -> Vec<String> {
+        h.children(n)
+            .map(|n| match h.get_optype(n) {
+                OpType::ExtensionOp(e) => e.unqualified_id().to_string(),
+                op => format!("{:?}", op.tag()),
+            })
+            .collect()
+    }
+}