From 87abf6e262c242d899c8f4e0fa5b4fdc4b9731e5 Mon Sep 17 00:00:00 2001 From: Lut99 Date: Tue, 22 Oct 2024 10:59:58 +0200 Subject: [PATCH] `Visitor` and `VisitorMut` can now optimize recursion for linear connections This to avoid Brane WIR-like problems with long, linear workflows that cause the stack to overflow. --- lib/reasoners/posix/src/workflow.rs | 8 +- lib/workflow/src/visitor.rs | 247 +++++++++++++++++++++++----- 2 files changed, 208 insertions(+), 47 deletions(-) diff --git a/lib/reasoners/posix/src/workflow.rs b/lib/reasoners/posix/src/workflow.rs index 376429c..10fb365 100644 --- a/lib/reasoners/posix/src/workflow.rs +++ b/lib/reasoners/posix/src/workflow.rs @@ -4,7 +4,7 @@ // Created: // 11 Oct 2024, 16:54:04 // Last edited: -// 18 Oct 2024, 11:27:06 +// 22 Oct 2024, 10:54:08 // Auto updated? // Yes // @@ -17,7 +17,7 @@ use std::sync::LazyLock; use tracing::{debug, span, Level}; use workflow::visitor::Visitor; -use workflow::{Dataset, ElemCall, Entity, Workflow}; +use workflow::{Dataset, Elem, ElemCall, Entity, Workflow}; /***** CONSTANTS *****/ @@ -85,7 +85,7 @@ impl<'w> Visitor<'w> for DatasetCollector<'w> { // self.write_sets.extend(repeat(location).zip(stop_sets.iter().cloned())); // } - fn visit_call(&mut self, elem: &'w ElemCall) -> Result<(), Self::Error> { + fn visit_call(&mut self, elem: &'w ElemCall) -> Result, Self::Error> { // We take a more simplified view on dataset reading/writing. // We consider a task's inputs as READING. Any task's outputs are WRITING. @@ -110,7 +110,7 @@ impl<'w> Visitor<'w> for DatasetCollector<'w> { } // Also visit the next one before returning, lol - self.visit(&elem.next) + Ok(Some(&elem.next)) } } diff --git a/lib/workflow/src/visitor.rs b/lib/workflow/src/visitor.rs index 0ec21ff..d6cb418 100644 --- a/lib/workflow/src/visitor.rs +++ b/lib/workflow/src/visitor.rs @@ -4,7 +4,7 @@ // Created: // 08 Oct 2024, 17:35:03 // Last edited: -// 14 Oct 2024, 11:55:45 +// 22 Oct 2024, 10:59:10 // Auto updated? // Yes // @@ -37,16 +37,43 @@ pub trait Visitor<'w> { /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. - fn visit(&mut self, elem: &'w Elem) -> Result<(), Self::Error> { - match elem { - Elem::Call(c) => self.visit_call(c), - - Elem::Branch(b) => self.visit_branch(b), - Elem::Parallel(p) => self.visit_parallel(p), - Elem::Loop(l) => self.visit_loop(l), - - Elem::Next => self.visit_next(), - Elem::Stop => self.visit_stop(), + fn visit(&mut self, mut elem: &'w Elem) -> Result<(), Self::Error> { + loop { + match elem { + Elem::Call(c) => match self.visit_call(c) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + + Elem::Branch(b) => match self.visit_branch(b) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + Elem::Parallel(p) => match self.visit_parallel(p) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + Elem::Loop(l) => match self.visit_loop(l) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + + // Note: these can never return a next + Elem::Next => return self.visit_next(), + Elem::Stop => return self.visit_stop(), + } } } @@ -55,30 +82,54 @@ pub trait Visitor<'w> { /// /// The default implementation doesn't do anything meaningful besides visiting the next node. /// + /// Usually, you don't call this function directly. Call [`Visitor::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemCall`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`Visitor::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_call(&mut self, elem: &'w ElemCall) -> Result<(), Self::Error> { self.visit(&elem.next) } + fn visit_call(&mut self, elem: &'w ElemCall) -> Result, Self::Error> { Ok(Some(&elem.next)) } /// Visits an [`Elem::Branch`]. /// /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`Visitor::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemBranch`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`Visitor::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_branch(&mut self, elem: &'w ElemBranch) -> Result<(), Self::Error> { + fn visit_branch(&mut self, elem: &'w ElemBranch) -> Result, Self::Error> { for b in &elem.branches { self.visit(b)?; } - self.visit(&elem.next) + Ok(Some(&elem.next)) } /// Visits an [`Elem::Parallel`]. @@ -86,17 +137,29 @@ pub trait Visitor<'w> { /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`Visitor::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemParallel`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`Visitor::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_parallel(&mut self, elem: &'w ElemParallel) -> Result<(), Self::Error> { + fn visit_parallel(&mut self, elem: &'w ElemParallel) -> Result, Self::Error> { for b in &elem.branches { self.visit(b)?; } - self.visit(&elem.next) + Ok(Some(&elem.next)) } /// Visits an [`Elem::Loop`]. @@ -110,9 +173,9 @@ pub trait Visitor<'w> { /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_loop(&mut self, elem: &'w ElemLoop) -> Result<(), Self::Error> { + fn visit_loop(&mut self, elem: &'w ElemLoop) -> Result, Self::Error> { self.visit(&elem.body)?; - self.visit(&elem.next) + Ok(Some(&elem.next)) } @@ -141,16 +204,16 @@ impl<'a, 'w, T: Visitor<'w>> Visitor<'w> for &'a mut T { fn visit(&mut self, elem: &'w Elem) -> Result<(), Self::Error> { T::visit(self, elem) } #[inline] - fn visit_call(&mut self, elem: &'w ElemCall) -> Result<(), Self::Error> { T::visit_call(self, elem) } + fn visit_call(&mut self, elem: &'w ElemCall) -> Result, Self::Error> { T::visit_call(self, elem) } #[inline] - fn visit_branch(&mut self, elem: &'w ElemBranch) -> Result<(), Self::Error> { T::visit_branch(self, elem) } + fn visit_branch(&mut self, elem: &'w ElemBranch) -> Result, Self::Error> { T::visit_branch(self, elem) } #[inline] - fn visit_parallel(&mut self, elem: &'w ElemParallel) -> Result<(), Self::Error> { T::visit_parallel(self, elem) } + fn visit_parallel(&mut self, elem: &'w ElemParallel) -> Result, Self::Error> { T::visit_parallel(self, elem) } #[inline] - fn visit_loop(&mut self, elem: &'w ElemLoop) -> Result<(), Self::Error> { T::visit_loop(self, elem) } + fn visit_loop(&mut self, elem: &'w ElemLoop) -> Result, Self::Error> { T::visit_loop(self, elem) } #[inline] fn visit_next(&mut self) -> Result<(), Self::Error> { T::visit_next(self) } @@ -180,16 +243,42 @@ pub trait VisitorMut<'w> { /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. - fn visit(&mut self, elem: &'w mut Elem) -> Result<(), Self::Error> { - match elem { - Elem::Call(c) => self.visit_call(c), - - Elem::Branch(b) => self.visit_branch(b), - Elem::Parallel(p) => self.visit_parallel(p), - Elem::Loop(l) => self.visit_loop(l), - - Elem::Next => self.visit_next(), - Elem::Stop => self.visit_stop(), + fn visit(&mut self, mut elem: &'w mut Elem) -> Result<(), Self::Error> { + loop { + match elem { + Elem::Call(c) => match self.visit_call(c) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + + Elem::Branch(b) => match self.visit_branch(b) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + Elem::Parallel(p) => match self.visit_parallel(p) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + Elem::Loop(l) => match self.visit_loop(l) { + Ok(Some(next)) => { + elem = next; + }, + Ok(None) => return Ok(()), + Err(err) => return Err(err), + }, + + Elem::Next => return self.visit_next(), + Elem::Stop => return self.visit_stop(), + } } } @@ -198,30 +287,54 @@ pub trait VisitorMut<'w> { /// /// The default implementation doesn't do anything meaningful besides visiting the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorMut::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemCall`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`VisitorMut::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_call(&mut self, elem: &'w mut ElemCall) -> Result<(), Self::Error> { self.visit(&mut elem.next) } + fn visit_call(&mut self, elem: &'w mut ElemCall) -> Result, Self::Error> { Ok(Some(&mut elem.next)) } /// Visits an [`Elem::Branch`]. /// /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorMut::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemBranch`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`VisitorMut::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_branch(&mut self, elem: &'w mut ElemBranch) -> Result<(), Self::Error> { + fn visit_branch(&mut self, elem: &'w mut ElemBranch) -> Result, Self::Error> { for b in &mut elem.branches { self.visit(b)?; } - self.visit(&mut elem.next) + Ok(Some(&mut elem.next)) } /// Visits an [`Elem::Parallel`]. @@ -229,17 +342,29 @@ pub trait VisitorMut<'w> { /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorMut::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemParallel`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`VisitorMut::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_parallel(&mut self, elem: &'w mut ElemParallel) -> Result<(), Self::Error> { + fn visit_parallel(&mut self, elem: &'w mut ElemParallel) -> Result, Self::Error> { for b in &mut elem.branches { self.visit(b)?; } - self.visit(&mut elem.next) + Ok(Some(&mut elem.next)) } /// Visits an [`Elem::Loop`]. @@ -247,15 +372,27 @@ pub trait VisitorMut<'w> { /// The default implementation doesn't do anything meaningful besides visiting the body, and /// then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorMut::visit()`] instead to + /// traverse a node. If you do call it manually, take care to process the + /// [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemLoop`]. /// + /// # Returns + /// This function can return the reference to a new [`Elem`] to traverse to. + /// + /// Implementations can do so when there is a "next" element to traverse that happens after all + /// visiting for this element is done. If so, then returning it instead of calling + /// [`VisitorMut::visit()`] manually saves stack space because it is traversed by iteration + /// instead of recursion. + /// /// # Errors /// If this visitor fails, then the whole visiting processes is terminated. #[inline] - fn visit_loop(&mut self, elem: &'w mut ElemLoop) -> Result<(), Self::Error> { + fn visit_loop(&mut self, elem: &'w mut ElemLoop) -> Result, Self::Error> { self.visit(&mut elem.body)?; - self.visit(&mut elem.next) + Ok(Some(&mut elem.next)) } @@ -284,16 +421,16 @@ impl<'a, 'w, T: VisitorMut<'w>> VisitorMut<'w> for &'a mut T { fn visit(&mut self, elem: &'w mut Elem) -> Result<(), Self::Error> { T::visit(self, elem) } #[inline] - fn visit_call(&mut self, elem: &'w mut ElemCall) -> Result<(), Self::Error> { T::visit_call(self, elem) } + fn visit_call(&mut self, elem: &'w mut ElemCall) -> Result, Self::Error> { T::visit_call(self, elem) } #[inline] - fn visit_branch(&mut self, elem: &'w mut ElemBranch) -> Result<(), Self::Error> { T::visit_branch(self, elem) } + fn visit_branch(&mut self, elem: &'w mut ElemBranch) -> Result, Self::Error> { T::visit_branch(self, elem) } #[inline] - fn visit_parallel(&mut self, elem: &'w mut ElemParallel) -> Result<(), Self::Error> { T::visit_parallel(self, elem) } + fn visit_parallel(&mut self, elem: &'w mut ElemParallel) -> Result, Self::Error> { T::visit_parallel(self, elem) } #[inline] - fn visit_loop(&mut self, elem: &'w mut ElemLoop) -> Result<(), Self::Error> { T::visit_loop(self, elem) } + fn visit_loop(&mut self, elem: &'w mut ElemLoop) -> Result, Self::Error> { T::visit_loop(self, elem) } #[inline] fn visit_next(&mut self) -> Result<(), Self::Error> { T::visit_next(self) } @@ -361,6 +498,10 @@ pub trait VisitorOwned { /// /// The default implementation doesn't do anything meaningful besides visiting the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemCall`]. /// @@ -380,6 +521,10 @@ pub trait VisitorOwned { /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemBranch`]. /// @@ -402,6 +547,10 @@ pub trait VisitorOwned { /// The default implementation doesn't do anything meaningful besides visiting the branches, /// and then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemParallel`]. /// @@ -424,6 +573,10 @@ pub trait VisitorOwned { /// The default implementation doesn't do anything meaningful besides visiting the body, and /// then the next node. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Arguments /// - `elem`: The visited [`ElemLoop`]. /// @@ -444,6 +597,10 @@ pub trait VisitorOwned { /// /// The default implementation doesn't do anything meaningful. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Returns /// An [`Elem::Next`] (i.e., nothing is replaced). /// @@ -456,6 +613,10 @@ pub trait VisitorOwned { /// /// The default implementation doesn't do anything meaningful. /// + /// Usually, you don't call this function directly. Call [`VisitorOwned::visit()`] or + /// [`VisitorOwned::visit_mut()`] instead to traverse a node. If you do call it manually, take + /// care to process the [returned value](#returns) correctly. + /// /// # Returns /// An [`Elem::Stop`] (i.e., nothing is replaced). ///