]> git.proxmox.com Git - cargo.git/blob - vendor/regex-syntax/src/hir/visitor.rs
New upstream version 0.52.0
[cargo.git] / vendor / regex-syntax / src / hir / visitor.rs
1 use crate::hir::{self, Hir, HirKind};
2
3 /// A trait for visiting the high-level IR (HIR) in depth first order.
4 ///
5 /// The principle aim of this trait is to enable callers to perform case
6 /// analysis on a high-level intermediate representation of a regular
7 /// expression without necessarily using recursion. In particular, this permits
8 /// callers to do case analysis with constant stack usage, which can be
9 /// important since the size of an HIR may be proportional to end user input.
10 ///
11 /// Typical usage of this trait involves providing an implementation and then
12 /// running it using the [`visit`](fn.visit.html) function.
13 pub trait Visitor {
14 /// The result of visiting an HIR.
15 type Output;
16 /// An error that visiting an HIR might return.
17 type Err;
18
19 /// All implementors of `Visitor` must provide a `finish` method, which
20 /// yields the result of visiting the HIR or an error.
21 fn finish(self) -> Result<Self::Output, Self::Err>;
22
23 /// This method is called before beginning traversal of the HIR.
24 fn start(&mut self) {}
25
26 /// This method is called on an `Hir` before descending into child `Hir`
27 /// nodes.
28 fn visit_pre(&mut self, _hir: &Hir) -> Result<(), Self::Err> {
29 Ok(())
30 }
31
32 /// This method is called on an `Hir` after descending all of its child
33 /// `Hir` nodes.
34 fn visit_post(&mut self, _hir: &Hir) -> Result<(), Self::Err> {
35 Ok(())
36 }
37
38 /// This method is called between child nodes of an alternation.
39 fn visit_alternation_in(&mut self) -> Result<(), Self::Err> {
40 Ok(())
41 }
42 }
43
44 /// Executes an implementation of `Visitor` in constant stack space.
45 ///
46 /// This function will visit every node in the given `Hir` while calling
47 /// appropriate methods provided by the
48 /// [`Visitor`](trait.Visitor.html) trait.
49 ///
50 /// The primary use case for this method is when one wants to perform case
51 /// analysis over an `Hir` without using a stack size proportional to the depth
52 /// of the `Hir`. Namely, this method will instead use constant stack space,
53 /// but will use heap space proportional to the size of the `Hir`. This may be
54 /// desirable in cases where the size of `Hir` is proportional to end user
55 /// input.
56 ///
57 /// If the visitor returns an error at any point, then visiting is stopped and
58 /// the error is returned.
59 pub fn visit<V: Visitor>(hir: &Hir, visitor: V) -> Result<V::Output, V::Err> {
60 HeapVisitor::new().visit(hir, visitor)
61 }
62
63 /// HeapVisitor visits every item in an `Hir` recursively using constant stack
64 /// size and a heap size proportional to the size of the `Hir`.
65 struct HeapVisitor<'a> {
66 /// A stack of `Hir` nodes. This is roughly analogous to the call stack
67 /// used in a typical recursive visitor.
68 stack: Vec<(&'a Hir, Frame<'a>)>,
69 }
70
71 /// Represents a single stack frame while performing structural induction over
72 /// an `Hir`.
73 enum Frame<'a> {
74 /// A stack frame allocated just before descending into a repetition
75 /// operator's child node.
76 Repetition(&'a hir::Repetition),
77 /// A stack frame allocated just before descending into a group's child
78 /// node.
79 Group(&'a hir::Group),
80 /// The stack frame used while visiting every child node of a concatenation
81 /// of expressions.
82 Concat {
83 /// The child node we are currently visiting.
84 head: &'a Hir,
85 /// The remaining child nodes to visit (which may be empty).
86 tail: &'a [Hir],
87 },
88 /// The stack frame used while visiting every child node of an alternation
89 /// of expressions.
90 Alternation {
91 /// The child node we are currently visiting.
92 head: &'a Hir,
93 /// The remaining child nodes to visit (which may be empty).
94 tail: &'a [Hir],
95 },
96 }
97
98 impl<'a> HeapVisitor<'a> {
99 fn new() -> HeapVisitor<'a> {
100 HeapVisitor { stack: vec![] }
101 }
102
103 fn visit<V: Visitor>(
104 &mut self,
105 mut hir: &'a Hir,
106 mut visitor: V,
107 ) -> Result<V::Output, V::Err> {
108 self.stack.clear();
109
110 visitor.start();
111 loop {
112 visitor.visit_pre(hir)?;
113 if let Some(x) = self.induct(hir) {
114 let child = x.child();
115 self.stack.push((hir, x));
116 hir = child;
117 continue;
118 }
119 // No induction means we have a base case, so we can post visit
120 // it now.
121 visitor.visit_post(hir)?;
122
123 // At this point, we now try to pop our call stack until it is
124 // either empty or we hit another inductive case.
125 loop {
126 let (post_hir, frame) = match self.stack.pop() {
127 None => return visitor.finish(),
128 Some((post_hir, frame)) => (post_hir, frame),
129 };
130 // If this is a concat/alternate, then we might have additional
131 // inductive steps to process.
132 if let Some(x) = self.pop(frame) {
133 if let Frame::Alternation { .. } = x {
134 visitor.visit_alternation_in()?;
135 }
136 hir = x.child();
137 self.stack.push((post_hir, x));
138 break;
139 }
140 // Otherwise, we've finished visiting all the child nodes for
141 // this HIR, so we can post visit it now.
142 visitor.visit_post(post_hir)?;
143 }
144 }
145 }
146
147 /// Build a stack frame for the given HIR if one is needed (which occurs if
148 /// and only if there are child nodes in the HIR). Otherwise, return None.
149 fn induct(&mut self, hir: &'a Hir) -> Option<Frame<'a>> {
150 match *hir.kind() {
151 HirKind::Repetition(ref x) => Some(Frame::Repetition(x)),
152 HirKind::Group(ref x) => Some(Frame::Group(x)),
153 HirKind::Concat(ref x) if x.is_empty() => None,
154 HirKind::Concat(ref x) => {
155 Some(Frame::Concat { head: &x[0], tail: &x[1..] })
156 }
157 HirKind::Alternation(ref x) if x.is_empty() => None,
158 HirKind::Alternation(ref x) => {
159 Some(Frame::Alternation { head: &x[0], tail: &x[1..] })
160 }
161 _ => None,
162 }
163 }
164
165 /// Pops the given frame. If the frame has an additional inductive step,
166 /// then return it, otherwise return `None`.
167 fn pop(&self, induct: Frame<'a>) -> Option<Frame<'a>> {
168 match induct {
169 Frame::Repetition(_) => None,
170 Frame::Group(_) => None,
171 Frame::Concat { tail, .. } => {
172 if tail.is_empty() {
173 None
174 } else {
175 Some(Frame::Concat { head: &tail[0], tail: &tail[1..] })
176 }
177 }
178 Frame::Alternation { tail, .. } => {
179 if tail.is_empty() {
180 None
181 } else {
182 Some(Frame::Alternation {
183 head: &tail[0],
184 tail: &tail[1..],
185 })
186 }
187 }
188 }
189 }
190 }
191
192 impl<'a> Frame<'a> {
193 /// Perform the next inductive step on this frame and return the next
194 /// child HIR node to visit.
195 fn child(&self) -> &'a Hir {
196 match *self {
197 Frame::Repetition(rep) => &rep.hir,
198 Frame::Group(group) => &group.hir,
199 Frame::Concat { head, .. } => head,
200 Frame::Alternation { head, .. } => head,
201 }
202 }
203 }