// jotdown/src/tree.rs (Rust, 414 lines, 11 KiB)

2022-11-12 12:45:17 -05:00
use crate::Span;
2022-11-28 14:12:49 -05:00
/// Kind of an [`Event`] produced while walking a tree.
///
/// `C` is the payload type carried by containers and `A` the payload type carried by atoms.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum EventKind<C, A> {
    /// The traversal descends into a container.
    Enter(C),
    /// An inline node was visited; it carries no payload of its own.
    Inline,
    /// The traversal leaves a container.
    Exit(C),
    /// An atom node was visited.
    Atom(A),
}
/// A single step of a tree traversal: what was encountered, and the span stored on the node
/// that produced the step.
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct Event<C, A> {
    /// What the traversal encountered.
    pub kind: EventKind<C, A>,
    /// Span copied from the node this event was generated from.
    pub span: Span,
}
/// Flat, immutable storage for all nodes of a finished tree. Nodes refer to each other by
/// index into this slice; the node at index 0 is the root.
pub struct Tree<C, A>(Box<[Node<C, A>]>);
2022-11-12 12:45:17 -05:00
2022-12-11 12:47:00 -05:00
#[derive(Clone)]
2022-12-11 14:49:57 -05:00
pub struct Inlines<'t, C, A> {
2022-12-11 12:47:00 -05:00
iter: std::slice::Iter<'t, Node<C, A>>,
}
2022-12-11 14:49:57 -05:00
impl<'t, C, A> Iterator for Inlines<'t, C, A> {
2022-12-11 12:47:00 -05:00
type Item = Span;
fn next(&mut self) -> Option<Self::Item> {
self.iter.next().map(|n| n.span)
}
}
2022-12-12 12:22:13 -05:00
impl<C, A> Tree<C, A> {
pub fn root(&self) -> Branch<C, A> {
let head = self.0[NodeIndex::root().index()].next;
// SAFETY: tree must outlive the branch
let nodes = unsafe { std::mem::transmute::<&[Node<C, A>], &'static [Node<C, A>]>(&self.0) };
Branch {
2022-11-28 14:19:22 -05:00
nodes,
branch: Vec::new(),
2022-12-08 11:42:54 -05:00
head,
2022-11-28 14:19:22 -05:00
}
2022-11-12 12:45:17 -05:00
}
}
2022-12-08 11:42:54 -05:00
/// Cursor over a tree's nodes that produces [`Event`]s when iterated.
#[derive(Clone)]
pub struct Branch<C: 'static, A: 'static> {
    /// Node storage that all indices held by this branch point into.
    nodes: &'static [Node<C, A>],
    /// Containers that have been entered by this branch but not exited yet, innermost last.
    branch: Vec<NodeIndex>,
    /// Node to visit next, or `None` when the current level has no more nodes.
    head: Option<NodeIndex>,
}
2022-12-11 12:47:00 -05:00
impl<C, A> Branch<C, A> {
2023-01-18 16:30:24 -05:00
pub fn empty() -> Self {
Self {
nodes: &[],
branch: Vec::new(),
head: None,
}
}
2023-01-18 15:44:58 -05:00
/// Count number of direct children nodes.
pub fn count_children(&self) -> usize {
let mut head = self.head;
let mut count = 0;
while let Some(h) = head {
let n = &self.nodes[h.index()];
head = n.next;
count += 1;
}
count
}
pub fn take_branch(&mut self) -> Self {
let head = self.head.take();
self.head = self.branch.pop();
if let Some(h) = self.head {
let n = &self.nodes[h.index()];
self.head = n.next;
}
Self {
nodes: self.nodes,
branch: Vec::new(),
head,
}
}
/// Retrieve all inlines until the end of the current container. Panics if any upcoming node is
/// not an inline node.
pub fn take_inlines(&mut self) -> impl Iterator<Item = Span> + '_ {
let mut head = self.head.take();
2022-12-08 11:42:54 -05:00
std::iter::from_fn(move || {
head.take().map(|h| {
let n = &self.nodes[h.index()];
assert!(matches!(n.kind, NodeKind::Inline));
2022-12-08 11:42:54 -05:00
head = n.next;
2022-12-11 14:49:57 -05:00
n.span
2022-12-08 11:42:54 -05:00
})
})
}
2022-11-12 12:45:17 -05:00
}
impl<C: Clone, A: Clone> Iterator for Branch<C, A> {
2022-12-10 04:26:06 -05:00
type Item = Event<C, A>;
2022-11-12 12:45:17 -05:00
fn next(&mut self) -> Option<Self::Item> {
if let Some(head) = self.head {
let n = &self.nodes[head.index()];
2022-11-28 14:12:49 -05:00
let kind = match &n.kind {
2022-12-08 11:42:54 -05:00
NodeKind::Root => unreachable!(),
2022-11-12 12:45:17 -05:00
NodeKind::Container(c, child) => {
self.branch.push(head);
self.head = *child;
2022-12-11 15:07:10 -05:00
EventKind::Enter(c.clone())
2022-11-12 12:45:17 -05:00
}
2022-12-12 12:22:13 -05:00
NodeKind::Atom(a) => {
2022-11-12 12:45:17 -05:00
self.head = n.next;
2022-12-12 12:22:13 -05:00
EventKind::Atom(a.clone())
2022-11-12 12:45:17 -05:00
}
2022-12-11 14:49:57 -05:00
NodeKind::Inline => {
self.head = n.next;
EventKind::Inline
}
2022-11-28 14:12:49 -05:00
};
Some(Event { kind, span: n.span })
2022-11-12 12:45:17 -05:00
} else if let Some(block_ni) = self.branch.pop() {
2022-11-28 18:33:43 -05:00
let Node { next, kind, span } = &self.nodes[block_ni.index()];
2022-12-12 12:22:13 -05:00
let kind = match kind {
NodeKind::Container(c, _) => EventKind::Exit(c.clone()),
_ => panic!(),
2022-11-28 18:33:43 -05:00
};
2022-11-12 12:45:17 -05:00
self.head = *next;
2022-12-12 12:22:13 -05:00
Some(Event { kind, span: *span })
2022-11-12 12:45:17 -05:00
} else {
None
}
}
}
/// Position of a node within the node storage.
///
/// The position is stored shifted up by one inside a `NonZeroUsize`, so the value zero is never
/// used and `Option<NodeIndex>` needs no more space than a plain `usize`.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
struct NodeIndex(std::num::NonZeroUsize);

impl NodeIndex {
    /// Wrap the zero-based position `i`.
    ///
    /// Panics if `i` is `usize::MAX`, since `i + 1` would not be representable.
    fn new(i: usize) -> Self {
        assert_ne!(i, usize::MAX);
        let shifted = std::num::NonZeroUsize::new(i + 1).unwrap();
        Self(shifted)
    }

    /// Index of the root node, which is always stored first.
    fn root() -> Self {
        Self::new(0)
    }

    /// Recover the zero-based position.
    fn index(self) -> usize {
        self.0.get() - 1
    }
}
2022-12-12 12:22:13 -05:00
#[derive(Debug, Clone, PartialEq, Eq)]
2022-12-10 04:26:06 -05:00
enum NodeKind<C, A> {
2022-11-12 12:45:17 -05:00
Root,
Container(C, Option<NodeIndex>),
2022-12-10 04:26:06 -05:00
Atom(A),
2022-12-11 14:49:57 -05:00
Inline,
2022-11-12 12:45:17 -05:00
}
#[derive(Debug, Clone)]
2022-12-10 04:26:06 -05:00
struct Node<C, A> {
2022-11-12 12:45:17 -05:00
span: Span,
2022-12-10 04:26:06 -05:00
kind: NodeKind<C, A>,
2022-11-12 12:45:17 -05:00
next: Option<NodeIndex>,
}
2022-12-10 04:26:06 -05:00
#[derive(Clone)]
pub struct Builder<C, A> {
nodes: Vec<Node<C, A>>,
2022-11-12 12:45:17 -05:00
branch: Vec<NodeIndex>,
head: Option<NodeIndex>,
}
2022-12-11 15:07:10 -05:00
impl<C: Clone, A: Clone> Builder<C, A> {
2022-11-12 12:45:17 -05:00
pub(super) fn new() -> Self {
Builder {
nodes: vec![Node {
span: Span::default(),
kind: NodeKind::Root,
next: None,
}],
branch: vec![],
head: Some(NodeIndex::root()),
}
}
2022-12-10 04:26:06 -05:00
pub(super) fn atom(&mut self, a: A, span: Span) {
2022-11-12 12:45:17 -05:00
self.add_node(Node {
span,
2022-12-10 04:26:06 -05:00
kind: NodeKind::Atom(a),
2022-11-12 12:45:17 -05:00
next: None,
});
}
2022-12-11 14:49:57 -05:00
pub(super) fn inline(&mut self, span: Span) {
self.add_node(Node {
span,
kind: NodeKind::Inline,
next: None,
});
}
2022-11-12 12:45:17 -05:00
pub(super) fn enter(&mut self, c: C, span: Span) {
self.add_node(Node {
span,
kind: NodeKind::Container(c, None),
next: None,
});
}
pub(super) fn exit(&mut self) {
if self.head.is_some() {
self.head = None;
} else {
let last = self.branch.pop();
assert_ne!(last, None);
}
}
2022-12-10 04:26:06 -05:00
pub(super) fn finish(self) -> Tree<C, A> {
Tree(self.nodes.into_boxed_slice())
2022-11-12 12:45:17 -05:00
}
2022-12-10 04:26:06 -05:00
fn add_node(&mut self, node: Node<C, A>) {
2022-11-12 12:45:17 -05:00
let ni = NodeIndex::new(self.nodes.len());
self.nodes.push(node);
if let Some(head_ni) = &mut self.head {
let mut head = &mut self.nodes[head_ni.index()];
match &mut head.kind {
2022-12-11 14:49:57 -05:00
NodeKind::Root | NodeKind::Inline | NodeKind::Atom(_) => {
// set next pointer of previous node
2022-11-12 12:45:17 -05:00
assert_eq!(head.next, None);
head.next = Some(ni);
}
NodeKind::Container(_, child) => {
self.branch.push(*head_ni);
2022-12-11 14:49:57 -05:00
// set child pointer of current container
2022-11-12 12:45:17 -05:00
assert_eq!(*child, None);
*child = Some(ni);
}
}
} else if let Some(block) = self.branch.pop() {
let mut block = &mut self.nodes[block.index()];
assert!(matches!(block.kind, NodeKind::Container(..)));
block.next = Some(ni);
} else {
panic!()
}
self.head = Some(ni);
}
}
impl<C: std::fmt::Debug + Clone + 'static, A: std::fmt::Debug + Clone + 'static> std::fmt::Debug
for Builder<C, A>
{
2022-11-12 12:45:17 -05:00
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
self.clone().finish().root().fmt(f)
2022-11-12 12:45:17 -05:00
}
}
impl<C: std::fmt::Debug + Clone, A: std::fmt::Debug + Clone> std::fmt::Debug for Branch<C, A> {
2022-11-12 12:45:17 -05:00
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
const INDENT: &str = " ";
let mut level = 0;
2022-12-12 12:22:13 -05:00
write!(f, "\n")?;
2022-12-11 15:07:10 -05:00
for e in self.clone() {
let indent = INDENT.repeat(level);
match e.kind {
EventKind::Enter(c) => {
write!(f, "{}{:?}", indent, c)?;
level += 1;
2022-11-28 14:12:49 -05:00
}
2022-12-11 15:07:10 -05:00
EventKind::Inline => write!(f, "{}Inline", indent)?,
EventKind::Exit(..) => {
level -= 1;
continue;
}
EventKind::Atom(a) => write!(f, "{}{:?}", indent, a)?,
}
writeln!(f, " ({}:{})", e.span.start(), e.span.end())?;
}
2022-11-12 12:45:17 -05:00
Ok(())
}
}
#[cfg(test)]
mod test {
    use crate::Span;

    use super::Event;
    use super::EventKind;

    /// The debug representation lists every node on its own line, indented by one `INDENT`
    /// unit per nesting level.
    #[test]
    fn fmt() {
        let mut tree = super::Builder::new();
        tree.enter(1, Span::new(0, 1));
        tree.atom(11, Span::new(0, 1));
        tree.atom(12, Span::new(0, 1));
        tree.exit();
        tree.enter(2, Span::new(1, 5));
        tree.enter(21, Span::new(2, 5));
        tree.enter(211, Span::new(3, 4));
        tree.atom(2111, Span::new(3, 4));
        tree.exit();
        tree.exit();
        tree.enter(22, Span::new(4, 5));
        tree.atom(221, Span::new(4, 5));
        tree.exit();
        tree.exit();
        tree.enter(3, Span::new(5, 6));
        tree.atom(31, Span::new(5, 6));
        tree.exit();
        assert_eq!(
            format!("{:?}", tree),
            concat!(
                "\n",
                "1 (0:1)\n",
                " 11 (0:1)\n",
                " 12 (0:1)\n",
                "2 (1:5)\n",
                " 21 (2:5)\n",
                "  211 (3:4)\n",
                "   2111 (3:4)\n",
                " 22 (4:5)\n",
                "  221 (4:5)\n",
                "3 (5:6)\n",
                " 31 (5:6)\n",
            )
        );
    }

    /// `take_branch` hands out the children of the container just entered and lets the
    /// original branch continue after that container.
    #[test]
    fn branch_take_branch() {
        let mut b = super::Builder::new();
        let sp = Span::new(0, 0);
        b.enter(1, sp);
        b.atom(11, sp);
        b.exit();
        b.enter(2, sp);
        b.enter(21, sp);
        b.atom(211, sp);
        b.exit();
        b.exit();
        b.enter(3, sp);
        b.atom(31, sp);
        let tree = b.finish();

        let mut root_branch = tree.root();
        assert_eq!(
            root_branch.by_ref().take(3).collect::<Vec<_>>(),
            &[
                Event {
                    kind: EventKind::Enter(1),
                    span: sp
                },
                Event {
                    kind: EventKind::Atom(11),
                    span: sp
                },
                Event {
                    kind: EventKind::Exit(1),
                    span: sp
                },
            ]
        );
        assert_eq!(
            root_branch.next(),
            Some(Event {
                kind: EventKind::Enter(2),
                span: sp
            })
        );
        assert_eq!(
            root_branch.take_branch().collect::<Vec<_>>(),
            &[
                Event {
                    kind: EventKind::Enter(21),
                    span: sp
                },
                Event {
                    kind: EventKind::Atom(211),
                    span: sp
                },
                Event {
                    kind: EventKind::Exit(21),
                    span: sp
                },
            ]
        );
        assert_eq!(
            root_branch.collect::<Vec<_>>(),
            &[
                Event {
                    kind: EventKind::Enter(3),
                    span: sp
                },
                Event {
                    kind: EventKind::Atom(31),
                    span: sp
                },
                Event {
                    kind: EventKind::Exit(3),
                    span: sp
                },
            ]
        );
    }
}