2024-04-24 11:07:38 +02:00
|
|
|
use drop_bomb::DropBomb;
|
|
|
|
|
2024-06-03 10:53:59 +02:00
|
|
|
use self::{
|
|
|
|
error::SyntaxError,
|
|
|
|
events::{Event, NodeKind},
|
|
|
|
input::Input,
|
|
|
|
syntax_kind::SyntaxKind,
|
|
|
|
};
|
|
|
|
use std::cell::Cell;
|
2024-04-24 11:07:38 +02:00
|
|
|
|
|
|
|
pub mod syntax_kind;
|
2024-04-03 00:30:11 +02:00
|
|
|
#[cfg(test)]
|
|
|
|
mod tests;
|
2024-04-24 11:07:38 +02:00
|
|
|
|
|
|
|
pub mod error;
|
|
|
|
pub mod events;
|
|
|
|
pub mod grammar;
|
|
|
|
pub mod input;
|
|
|
|
pub mod output;
|
|
|
|
|
2024-06-03 10:53:59 +02:00
|
|
|
/// Budget for the parser's step counter: `Parser::step` panics with
/// "the parser seems stuck..." once the counter has grown past this value.
const PARSER_STEP_LIMIT: u32 = 4_096;
|
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
pub struct Parser<'src, 'toks> {
|
|
|
|
input: Input<'src, 'toks>,
|
|
|
|
pos: usize,
|
|
|
|
events: Vec<Event>,
|
2024-06-03 10:53:59 +02:00
|
|
|
steps: Cell<u32>,
|
2024-04-03 00:08:00 +02:00
|
|
|
}
|
2024-04-24 11:07:38 +02:00
|
|
|
|
|
|
|
impl<'src, 'toks> Parser<'src, 'toks> {
|
|
|
|
pub fn new(input: Input<'src, 'toks>) -> Self {
|
|
|
|
Self {
|
|
|
|
input,
|
|
|
|
pos: 0,
|
|
|
|
events: Vec::new(),
|
2024-06-03 10:53:59 +02:00
|
|
|
steps: Cell::new(0),
|
2024-04-03 00:08:00 +02:00
|
|
|
}
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
|
|
|
|
2024-06-03 10:53:59 +02:00
|
|
|
pub fn finish(self) -> Vec<Event> {
|
|
|
|
self.events
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn nth(&self, n: usize) -> SyntaxKind {
|
2024-06-03 10:53:59 +02:00
|
|
|
self.step();
|
2024-04-24 11:07:38 +02:00
|
|
|
self.input.kind(self.pos + n)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn eat_succeeding_ws(&mut self) {
|
|
|
|
self.push_ev(Event::Eat {
|
|
|
|
count: self.input.meaningless_tail_len(),
|
2024-04-11 03:23:03 +02:00
|
|
|
});
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
2024-04-11 03:23:03 +02:00
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
pub(crate) fn current(&self) -> SyntaxKind {
|
2024-06-03 10:53:59 +02:00
|
|
|
self.step();
|
2024-04-24 11:07:38 +02:00
|
|
|
self.input.kind(self.pos)
|
|
|
|
}
|
2024-04-11 03:23:03 +02:00
|
|
|
|
2024-04-24 19:55:16 +02:00
|
|
|
pub(crate) fn start(&mut self, name: &str) -> Marker {
|
2024-04-24 11:07:38 +02:00
|
|
|
let pos = self.events.len();
|
|
|
|
self.push_ev(Event::tombstone());
|
2024-04-24 19:55:16 +02:00
|
|
|
Marker::new(pos, name)
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn at(&self, kind: SyntaxKind) -> bool {
|
|
|
|
self.nth_at(0, kind)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn eat(&mut self, kind: SyntaxKind) -> bool {
|
|
|
|
if !self.at(kind) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
self.do_bump();
|
|
|
|
true
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn nth_at(&self, n: usize, kind: SyntaxKind) -> bool {
|
|
|
|
self.nth(n) == kind
|
|
|
|
}
|
|
|
|
|
|
|
|
fn do_bump(&mut self) {
|
|
|
|
self.push_ev(Event::Eat {
|
|
|
|
count: self.input.preceding_meaningless(self.pos),
|
|
|
|
});
|
|
|
|
self.pos += 1;
|
|
|
|
}
|
2024-04-11 03:23:03 +02:00
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
fn push_ev(&mut self, event: Event) {
|
|
|
|
self.events.push(event)
|
|
|
|
}
|
2024-06-03 10:53:59 +02:00
|
|
|
|
|
|
|
fn step(&self) {
|
|
|
|
let steps = self.steps.get();
|
|
|
|
assert!(steps <= PARSER_STEP_LIMIT, "the parser seems stuck...");
|
|
|
|
self.steps.set(steps + 1);
|
|
|
|
}
|
2024-04-03 00:08:00 +02:00
|
|
|
}
|
2024-04-08 14:04:52 +02:00
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
pub(crate) struct Marker {
|
|
|
|
pos: usize,
|
|
|
|
bomb: DropBomb,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Marker {
|
2024-04-24 19:55:16 +02:00
|
|
|
pub(crate) fn new(pos: usize, name: &str) -> Self {
|
2024-04-24 11:07:38 +02:00
|
|
|
Self {
|
|
|
|
pos,
|
2024-04-24 19:55:16 +02:00
|
|
|
bomb: DropBomb::new(format!("Marker {name} must be completed or abandoned")),
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
|
|
|
}
|
2024-04-24 19:37:52 +02:00
|
|
|
|
2024-06-03 11:22:36 +02:00
|
|
|
fn close_node(mut self, p: &mut Parser, kind: NodeKind) -> CompletedMarker {
|
2024-04-24 11:07:38 +02:00
|
|
|
self.bomb.defuse();
|
|
|
|
match &mut p.events[self.pos] {
|
2024-06-03 10:53:59 +02:00
|
|
|
Event::Start { kind: slot, .. } => *slot = kind.clone(),
|
2024-04-24 11:07:38 +02:00
|
|
|
_ => unreachable!(),
|
|
|
|
}
|
2024-06-03 10:53:59 +02:00
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
p.push_ev(Event::Finish);
|
|
|
|
|
|
|
|
CompletedMarker {
|
|
|
|
pos: self.pos,
|
|
|
|
kind,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-06-03 10:53:59 +02:00
|
|
|
pub(crate) fn complete(self, p: &mut Parser<'_, '_>, kind: SyntaxKind) -> CompletedMarker {
|
2024-06-03 11:22:36 +02:00
|
|
|
self.close_node(p, NodeKind::Syntax(kind))
|
2024-06-03 10:53:59 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn error(self, p: &mut Parser, kind: SyntaxError) -> CompletedMarker {
|
2024-06-03 11:22:36 +02:00
|
|
|
self.close_node(p, NodeKind::Error(kind))
|
2024-04-24 19:37:52 +02:00
|
|
|
}
|
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
pub(crate) fn abandon(mut self, p: &mut Parser<'_, '_>) {
|
|
|
|
self.bomb.defuse();
|
|
|
|
if self.pos == p.events.len() - 1 {
|
|
|
|
match p.events.pop() {
|
|
|
|
Some(Event::Start {
|
2024-06-03 10:53:59 +02:00
|
|
|
kind: NodeKind::Syntax(SyntaxKind::TOMBSTONE),
|
2024-04-24 11:07:38 +02:00
|
|
|
forward_parent: None,
|
|
|
|
}) => (),
|
|
|
|
_ => unreachable!(),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) struct CompletedMarker {
|
|
|
|
pos: usize,
|
2024-06-03 10:53:59 +02:00
|
|
|
kind: NodeKind,
|
2024-04-24 11:07:38 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
impl CompletedMarker {
|
2024-04-30 12:21:06 +02:00
|
|
|
pub(crate) fn precede(self, p: &mut Parser<'_, '_>, name: &str) -> Marker {
|
|
|
|
let new_pos = p.start(name);
|
2024-04-24 11:07:38 +02:00
|
|
|
|
|
|
|
match &mut p.events[self.pos] {
|
|
|
|
Event::Start { forward_parent, .. } => {
|
|
|
|
*forward_parent = Some(new_pos.pos - self.pos);
|
|
|
|
}
|
|
|
|
_ => unreachable!(),
|
|
|
|
}
|
2024-04-08 14:04:52 +02:00
|
|
|
|
2024-04-24 11:07:38 +02:00
|
|
|
new_pos
|
|
|
|
}
|
2024-04-08 14:04:52 +02:00
|
|
|
}
|