summaryrefslogtreecommitdiffstats
path: root/third_party/rust/jsparagus-parser/src/simulator.rs
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 09:22:09 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-07 09:22:09 +0000
commit43a97878ce14b72f0981164f87f2e35e14151312 (patch)
tree620249daf56c0258faa40cbdcf9cfba06de2a846 /third_party/rust/jsparagus-parser/src/simulator.rs
parentInitial commit. (diff)
downloadfirefox-upstream.tar.xz
firefox-upstream.zip
Adding upstream version 110.0.1.upstream/110.0.1upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'third_party/rust/jsparagus-parser/src/simulator.rs')
-rw-r--r--third_party/rust/jsparagus-parser/src/simulator.rs211
1 files changed, 211 insertions, 0 deletions
diff --git a/third_party/rust/jsparagus-parser/src/simulator.rs b/third_party/rust/jsparagus-parser/src/simulator.rs
new file mode 100644
index 0000000000..0e060fd5c1
--- /dev/null
+++ b/third_party/rust/jsparagus-parser/src/simulator.rs
@@ -0,0 +1,211 @@
+//! Simulates parser execution, for a single token of input, without incurring
+//! any side effects.
+//!
+//! This is basically a copy of the parser.rs source code with calls to
+//! generated_parser::reduce, and stack bookkeeping, omitted.
+
+use crate::parser::Parser;
+use arrayvec::ArrayVec;
+use ast::SourceLocation;
+use generated_parser::{
+ noop_actions, ParseError, ParserTrait, Result, StackValue, TermValue, TerminalId, Token, TABLES,
+};
+
+/// The Simulator is used to check whether we can shift one token, either to
+/// check what might be accepted, or to check whether we can End parsing now.
+/// This is used by the REPL to verify whether or not we can end the input.
+pub struct Simulator<'alloc, 'parser> {
+ /// Define the top of the immutable stack.
+ sp: usize,
+ /// Immutable state stack coming from the forked parser.
+ state_stack: &'parser [usize],
+ /// Immuatable term stack coming from the forked parser.
+ node_stack: &'parser [TermValue<StackValue<'alloc>>],
+ /// Mutable state stack used by the simulator on top of the immutable
+ /// parser's state stack.
+ ///
+ /// Uses a fixed-size array as the number of lookahead is bounded to a lower
+ /// value, panics otherwise.
+ sim_state_stack: ArrayVec<usize, 4>,
+ /// Mutable term stack used by the simulator on top of the immutable
+ /// parser's term stack.
+ ///
+ /// Uses a fixed-size array as the number of lookahead is bounded to a lower
+ /// value, panics otherwise.
+ sim_node_stack: ArrayVec<TermValue<()>, 4>,
+ /// Mutable term stack used by the simulator for replaying terms when
+ /// reducing non-terminals are replaying lookahead terminals.
+ ///
+ /// Uses a fixed-size array as the number of lookahead is bounded to a lower
+ /// value, panics otherwise.
+ replay_stack: ArrayVec<TermValue<()>, 4>,
+}
+
+impl<'alloc, 'parser> ParserTrait<'alloc, ()> for Simulator<'alloc, 'parser> {
+ fn shift(&mut self, tv: TermValue<()>) -> Result<'alloc, bool> {
+ // Shift the new terminal/nonterminal and its associated value.
+ let mut state = self.state();
+ assert!(state < TABLES.shift_count);
+ let mut tv = tv;
+ loop {
+ let term_index: usize = tv.term.into();
+ assert!(term_index < TABLES.shift_width);
+ let index = state * TABLES.shift_width + term_index;
+ let goto = TABLES.shift_table[index];
+ if goto < 0 {
+ // Error handling is in charge of shifting an ErrorSymbol from the
+ // current state.
+ self.try_error_handling(tv)?;
+ tv = self.replay_stack.pop().unwrap();
+ continue;
+ }
+ state = goto as usize;
+ self.sim_state_stack.push(state);
+ self.sim_node_stack.push(tv);
+ // Execute any actions, such as reduce actions.
+ if state >= TABLES.shift_count {
+ assert!(state < TABLES.action_count + TABLES.shift_count);
+ if noop_actions(self, state)? {
+ return Ok(true);
+ }
+ state = self.state();
+ }
+ assert!(state < TABLES.shift_count);
+ if let Some(tv_temp) = self.replay_stack.pop() {
+ tv = tv_temp;
+ } else {
+ break;
+ }
+ }
+ Ok(false)
+ }
+ fn shift_replayed(&mut self, state: usize) {
+ let tv = self.replay_stack.pop().unwrap();
+ self.sim_state_stack.push(state);
+ self.sim_node_stack.push(tv);
+ }
+ fn unshift(&mut self) {
+ let tv = self.pop();
+ self.replay(tv)
+ }
+ fn pop(&mut self) -> TermValue<()> {
+ if let Some(s) = self.sim_node_stack.pop() {
+ self.sim_state_stack.pop();
+ return s;
+ }
+ let t = self.node_stack[self.sp - 1].term;
+ self.sp -= 1;
+ TermValue { term: t, value: () }
+ }
+ fn replay(&mut self, tv: TermValue<()>) {
+ self.replay_stack.push(tv)
+ }
+ fn epsilon(&mut self, state: usize) {
+ if self.sim_state_stack.is_empty() {
+ self.sim_state_stack.push(self.state_stack[self.sp]);
+ self.sim_node_stack.push(TermValue {
+ term: self.node_stack[self.sp - 1].term,
+ value: (),
+ });
+ self.sp -= 1;
+ }
+ *self.sim_state_stack.last_mut().unwrap() = state;
+ }
+ fn top_state(&self) -> usize {
+ self.state()
+ }
+ fn check_not_on_new_line(&mut self, _peek: usize) -> Result<'alloc, bool> {
+ Ok(true)
+ }
+}
+
+impl<'alloc, 'parser> Simulator<'alloc, 'parser> {
+ pub fn new(
+ state_stack: &'parser [usize],
+ node_stack: &'parser [TermValue<StackValue<'alloc>>],
+ ) -> Simulator<'alloc, 'parser> {
+ let sp = state_stack.len() - 1;
+ assert_eq!(state_stack.len(), node_stack.len() + 1);
+ Simulator {
+ sp,
+ state_stack,
+ node_stack,
+ sim_state_stack: ArrayVec::new(),
+ sim_node_stack: ArrayVec::new(),
+ replay_stack: ArrayVec::new(),
+ }
+ }
+
+ fn state(&self) -> usize {
+ if let Some(res) = self.sim_state_stack.last() {
+ *res
+ } else {
+ self.state_stack[self.sp]
+ }
+ }
+
+ pub fn write_token(&mut self, t: TerminalId) -> Result<'alloc, ()> {
+ // Shift the token with the associated StackValue.
+ let accept = self.shift(TermValue {
+ term: t.into(),
+ value: (),
+ })?;
+ // JavaScript grammar accepts empty inputs, therefore we can never
+ // accept any program before receiving a TerminalId::End.
+ assert!(!accept);
+ Ok(())
+ }
+
+ pub fn close(&mut self, _position: usize) -> Result<'alloc, ()> {
+ // Shift the End terminal with the associated StackValue.
+ let accept = self.shift(TermValue {
+ term: TerminalId::End.into(),
+ value: (),
+ })?;
+ // Adding a TerminalId::End would either lead to a parse error, or to
+ // accepting the current input. In which case we return matching node
+ // value.
+ assert!(accept);
+
+ // We can either reduce a Script/Module, or a Script/Module followed by
+ // an <End> terminal.
+ assert!(self.sp + self.sim_node_stack.len() >= 1);
+ Ok(())
+ }
+
+ // Simulate the action of Parser::try_error_handling.
+ fn try_error_handling(&mut self, t: TermValue<()>) -> Result<'alloc, bool> {
+ if t.term.is_terminal() {
+ let term = t.term.to_terminal();
+ let bogus_loc = SourceLocation::new(0, 0);
+ let token = &Token::basic_token(term, bogus_loc);
+
+ // Error tokens might them-self cause more errors to be reported.
+ // This happens due to the fact that the ErrorToken can be replayed,
+ // and while the ErrorToken might be in the lookahead rules, it
+ // might not be in the shifted terms coming after the reduced
+ // nonterminal.
+ if term == TerminalId::ErrorToken {
+ return Err(Parser::parse_error(token).into());
+ }
+
+ // Otherwise, check if the current rule accept an Automatic
+ // Semi-Colon insertion (ASI).
+ let state = self.state();
+ assert!(state < TABLES.shift_count);
+ let error_code = TABLES.error_codes[state];
+ if let Some(error_code) = error_code {
+ Parser::recover(token, error_code)?;
+ self.replay(t);
+ self.replay(TermValue {
+ term: TerminalId::ErrorToken.into(),
+ value: (),
+ });
+ return Ok(false);
+ }
+ return Err(Parser::parse_error(token).into());
+ }
+ // On error, don't attempt error handling again.
+ Err(ParseError::ParserCannotUnpackToken.into())
+ }
+}