2021-08-28 17:36:41 +00:00
|
|
|
//! Serialization-friendly representation of `tt::Subtree`.
|
|
|
|
//!
|
|
|
|
//! It is possible to serialize `Subtree` as is, as a tree, but using
|
|
|
|
//! arbitrary-nested trees in JSON is problematic, as they can cause the JSON
|
|
|
|
//! parser to overflow the stack.
|
|
|
|
//!
|
|
|
|
//! Additionally, such implementation would be pretty verbose, and we do care
|
|
|
|
//! about performance here a bit.
|
|
|
|
//!
|
|
|
|
//! So what this module does is dumping a `tt::Subtree` into a bunch of flat
|
|
|
|
//! array of numbers. See the test in the parent module to get an example
|
|
|
|
//! output.
|
|
|
|
//!
|
|
|
|
//! ```json
|
|
|
|
//! {
|
|
|
|
//! // Array of subtrees, each subtree is represented by 4 numbers:
|
|
|
|
//! // id of delimiter, delimiter kind, index of first child in `token_tree`,
|
|
|
|
//! // index of last child in `token_tree`
|
|
|
|
//! "subtree":[4294967295,0,0,5,2,2,5,5],
|
|
|
|
//! // 2 ints per literal: [token id, index into `text`]
|
|
|
|
//! "literal":[4294967295,1],
|
|
|
|
//! // 3 ints per punct: [token id, char, spacing]
|
|
|
|
//! "punct":[4294967295,64,1],
|
|
|
|
//! // 2 ints per ident: [token id, index into `text`]
|
|
|
|
//! "ident": [0,0,1,1],
|
|
|
|
//! // children of all subtrees, concatenated. Each child is represented as `index << 2 | tag`
|
|
|
|
//! // where tag denotes one of subtree, literal, punct or ident.
|
|
|
|
//! "token_tree":[3,7,1,4],
|
|
|
|
//! // Strings shared by idents and literals
|
|
|
|
//! "text": ["struct","Foo"]
|
|
|
|
//! }
|
|
|
|
//! ```
|
|
|
|
//!
|
|
|
|
//! We probably should replace most of the code here with bincode someday, but,
|
|
|
|
//! as we don't have bincode in Cargo.toml yet, lets stick with serde_json for
|
|
|
|
//! the time being.
|
|
|
|
|
2022-08-08 23:16:32 +00:00
|
|
|
use std::collections::{HashMap, VecDeque};
|
2021-08-28 17:36:41 +00:00
|
|
|
|
|
|
|
use serde::{Deserialize, Serialize};
|
2023-09-29 10:37:57 +00:00
|
|
|
use text_size::TextRange;
|
2023-10-06 12:47:11 +00:00
|
|
|
use tt::{Span, SyntaxContext};
|
2023-01-31 10:49:49 +00:00
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
use crate::msg::{ENCODE_CLOSE_SPAN_VERSION, VARIABLE_SIZED_SPANS};
|
|
|
|
|
|
|
|
pub trait SerializableSpan<const L: usize>: Span {
|
|
|
|
fn into_u32(self) -> [u32; L];
|
|
|
|
fn from_u32(input: [u32; L]) -> Self;
|
|
|
|
}
|
2023-10-06 12:47:11 +00:00
|
|
|
// impl SerializableSpan<1> for tt::TokenId {
|
|
|
|
// fn into_u32(self) -> [u32; 1] {
|
|
|
|
// [self.0]
|
|
|
|
// }
|
|
|
|
// fn from_u32([input]: [u32; 1]) -> Self {
|
|
|
|
// tt::TokenId(input)
|
|
|
|
// }
|
|
|
|
// }
|
2021-08-28 17:36:41 +00:00
|
|
|
|
2023-10-06 12:47:11 +00:00
|
|
|
impl<Anchor, Ctx> SerializableSpan<3> for tt::SpanData<Anchor, Ctx>
|
2023-09-29 10:37:57 +00:00
|
|
|
where
|
2023-10-06 12:47:11 +00:00
|
|
|
Anchor: From<u32> + Into<u32>,
|
2023-09-29 10:37:57 +00:00
|
|
|
Self: Span,
|
2023-10-06 12:47:11 +00:00
|
|
|
Ctx: SyntaxContext,
|
2023-09-29 10:37:57 +00:00
|
|
|
{
|
|
|
|
fn into_u32(self) -> [u32; 3] {
|
|
|
|
[self.anchor.into(), self.range.start().into(), self.range.end().into()]
|
|
|
|
}
|
|
|
|
fn from_u32([file_id, start, end]: [u32; 3]) -> Self {
|
2023-10-06 12:47:11 +00:00
|
|
|
tt::SpanData {
|
|
|
|
anchor: file_id.into(),
|
|
|
|
range: TextRange::new(start.into(), end.into()),
|
|
|
|
ctx: Ctx::DUMMY,
|
|
|
|
}
|
2023-09-29 10:37:57 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-28 17:36:41 +00:00
|
|
|
#[derive(Serialize, Deserialize, Debug)]
|
|
|
|
pub struct FlatTree {
|
|
|
|
subtree: Vec<u32>,
|
|
|
|
literal: Vec<u32>,
|
|
|
|
punct: Vec<u32>,
|
|
|
|
ident: Vec<u32>,
|
|
|
|
token_tree: Vec<u32>,
|
|
|
|
text: Vec<String>,
|
2023-06-29 10:23:45 +00:00
|
|
|
#[serde(skip_serializing_if = "SpanMap::do_serialize")]
|
|
|
|
#[serde(default)]
|
|
|
|
span_map: SpanMap,
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Serialize, Deserialize, Debug)]
|
2023-11-25 13:39:55 +00:00
|
|
|
struct SpanMap {
|
2023-06-29 10:23:45 +00:00
|
|
|
#[serde(skip_serializing)]
|
|
|
|
serialize: bool,
|
|
|
|
span_size: u32,
|
|
|
|
spans: Vec<u32>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Default for SpanMap {
|
|
|
|
fn default() -> Self {
|
|
|
|
Self { serialize: false, span_size: 1, spans: Default::default() }
|
|
|
|
}
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl SpanMap {
|
|
|
|
fn serialize_span<const L: usize, S: SerializableSpan<L>>(&mut self, span: S) -> u32 {
|
|
|
|
let u32s = span.into_u32();
|
|
|
|
if L == 1 {
|
|
|
|
u32s[0]
|
|
|
|
} else {
|
|
|
|
let offset = self.spans.len() as u32;
|
|
|
|
self.spans.extend(u32s);
|
|
|
|
offset
|
|
|
|
}
|
|
|
|
}
|
|
|
|
fn deserialize_span<const L: usize, S: SerializableSpan<L>>(&self, offset: u32) -> S {
|
|
|
|
S::from_u32(if L == 1 {
|
|
|
|
[offset].as_ref().try_into().unwrap()
|
|
|
|
} else {
|
|
|
|
self.spans[offset as usize..][..L].try_into().unwrap()
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl SpanMap {
|
2023-11-25 13:39:55 +00:00
|
|
|
fn do_serialize(&self) -> bool {
|
2023-06-29 10:23:45 +00:00
|
|
|
self.serialize
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
struct SubtreeRepr<const L: usize, S> {
|
|
|
|
open: S,
|
|
|
|
close: S,
|
2023-01-31 10:49:49 +00:00
|
|
|
kind: tt::DelimiterKind,
|
2021-08-28 17:36:41 +00:00
|
|
|
tt: [u32; 2],
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
struct LiteralRepr<const L: usize, S> {
|
|
|
|
id: S,
|
2021-08-28 17:36:41 +00:00
|
|
|
text: u32,
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
struct PunctRepr<const L: usize, S> {
|
|
|
|
id: S,
|
2021-08-28 17:36:41 +00:00
|
|
|
char: char,
|
|
|
|
spacing: tt::Spacing,
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
struct IdentRepr<const L: usize, S> {
|
|
|
|
id: S,
|
2021-08-28 17:36:41 +00:00
|
|
|
text: u32,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl FlatTree {
|
2023-06-29 10:23:45 +00:00
|
|
|
pub fn new<const L: usize, S: SerializableSpan<L>>(
|
|
|
|
subtree: &tt::Subtree<S>,
|
|
|
|
version: u32,
|
|
|
|
) -> FlatTree {
|
2021-08-28 17:36:41 +00:00
|
|
|
let mut w = Writer {
|
|
|
|
string_table: HashMap::new(),
|
|
|
|
work: VecDeque::new(),
|
|
|
|
|
|
|
|
subtree: Vec::new(),
|
|
|
|
literal: Vec::new(),
|
|
|
|
punct: Vec::new(),
|
|
|
|
ident: Vec::new(),
|
|
|
|
token_tree: Vec::new(),
|
|
|
|
text: Vec::new(),
|
|
|
|
};
|
|
|
|
w.write(subtree);
|
2023-06-29 10:23:45 +00:00
|
|
|
assert!(L == 1 || version >= VARIABLE_SIZED_SPANS);
|
|
|
|
let mut span_map = SpanMap {
|
|
|
|
serialize: version >= VARIABLE_SIZED_SPANS && L != 1,
|
|
|
|
span_size: L as u32,
|
|
|
|
spans: Vec::new(),
|
|
|
|
};
|
2021-08-28 17:36:41 +00:00
|
|
|
return FlatTree {
|
2023-04-14 08:34:41 +00:00
|
|
|
subtree: if version >= ENCODE_CLOSE_SPAN_VERSION {
|
2023-06-29 10:23:45 +00:00
|
|
|
write_vec(&mut span_map, w.subtree, SubtreeRepr::write_with_close_span)
|
2023-04-14 08:34:41 +00:00
|
|
|
} else {
|
2023-06-29 10:23:45 +00:00
|
|
|
write_vec(&mut span_map, w.subtree, SubtreeRepr::write)
|
2023-04-14 08:34:41 +00:00
|
|
|
},
|
2023-06-29 10:23:45 +00:00
|
|
|
literal: write_vec(&mut span_map, w.literal, LiteralRepr::write),
|
|
|
|
punct: write_vec(&mut span_map, w.punct, PunctRepr::write),
|
|
|
|
ident: write_vec(&mut span_map, w.ident, IdentRepr::write),
|
2021-08-28 17:36:41 +00:00
|
|
|
token_tree: w.token_tree,
|
|
|
|
text: w.text,
|
2023-06-29 10:23:45 +00:00
|
|
|
span_map,
|
2021-08-28 17:36:41 +00:00
|
|
|
};
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
fn write_vec<T, F: Fn(T, &mut SpanMap) -> [u32; N], const N: usize>(
|
|
|
|
map: &mut SpanMap,
|
|
|
|
xs: Vec<T>,
|
|
|
|
f: F,
|
|
|
|
) -> Vec<u32> {
|
|
|
|
xs.into_iter().flat_map(|it| f(it, map)).collect()
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
pub fn to_subtree<const L: usize, S: SerializableSpan<L>>(
|
|
|
|
self,
|
|
|
|
version: u32,
|
|
|
|
) -> tt::Subtree<S> {
|
|
|
|
assert!((version >= VARIABLE_SIZED_SPANS || L == 1) && L as u32 == self.span_map.span_size);
|
2021-08-28 17:36:41 +00:00
|
|
|
return Reader {
|
2023-04-14 08:34:41 +00:00
|
|
|
subtree: if version >= ENCODE_CLOSE_SPAN_VERSION {
|
2023-06-29 10:23:45 +00:00
|
|
|
read_vec(&self.span_map, self.subtree, SubtreeRepr::read_with_close_span)
|
2023-04-14 08:34:41 +00:00
|
|
|
} else {
|
2023-06-29 10:23:45 +00:00
|
|
|
read_vec(&self.span_map, self.subtree, SubtreeRepr::read)
|
2023-04-14 08:34:41 +00:00
|
|
|
},
|
2023-06-29 10:23:45 +00:00
|
|
|
literal: read_vec(&self.span_map, self.literal, LiteralRepr::read),
|
|
|
|
punct: read_vec(&self.span_map, self.punct, PunctRepr::read),
|
|
|
|
ident: read_vec(&self.span_map, self.ident, IdentRepr::read),
|
2021-08-28 17:36:41 +00:00
|
|
|
token_tree: self.token_tree,
|
|
|
|
text: self.text,
|
|
|
|
}
|
|
|
|
.read();
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read_vec<T, F: Fn([u32; N], &SpanMap) -> T, const N: usize>(
|
|
|
|
map: &SpanMap,
|
|
|
|
xs: Vec<u32>,
|
|
|
|
f: F,
|
|
|
|
) -> Vec<T> {
|
2021-08-28 17:36:41 +00:00
|
|
|
let mut chunks = xs.chunks_exact(N);
|
2023-06-29 10:23:45 +00:00
|
|
|
let res = chunks.by_ref().map(|chunk| f(chunk.try_into().unwrap(), map)).collect();
|
2021-08-28 17:36:41 +00:00
|
|
|
assert!(chunks.remainder().is_empty());
|
|
|
|
res
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<const L: usize, S: SerializableSpan<L>> SubtreeRepr<L, S> {
|
|
|
|
fn write(self, map: &mut SpanMap) -> [u32; 4] {
|
2021-08-28 17:36:41 +00:00
|
|
|
let kind = match self.kind {
|
2023-01-31 10:49:49 +00:00
|
|
|
tt::DelimiterKind::Invisible => 0,
|
|
|
|
tt::DelimiterKind::Parenthesis => 1,
|
|
|
|
tt::DelimiterKind::Brace => 2,
|
|
|
|
tt::DelimiterKind::Bracket => 3,
|
2021-08-28 17:36:41 +00:00
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
[map.serialize_span(self.open), kind, self.tt[0], self.tt[1]]
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read([open, kind, lo, len]: [u32; 4], map: &SpanMap) -> Self {
|
2021-08-28 17:36:41 +00:00
|
|
|
let kind = match kind {
|
2023-01-31 10:49:49 +00:00
|
|
|
0 => tt::DelimiterKind::Invisible,
|
|
|
|
1 => tt::DelimiterKind::Parenthesis,
|
|
|
|
2 => tt::DelimiterKind::Brace,
|
|
|
|
3 => tt::DelimiterKind::Bracket,
|
2022-12-23 18:42:58 +00:00
|
|
|
other => panic!("bad kind {other}"),
|
2021-08-28 17:36:41 +00:00
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
SubtreeRepr { open: map.deserialize_span(open), close: S::DUMMY, kind, tt: [lo, len] }
|
2023-04-14 08:34:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn write_with_close_span(self, map: &mut SpanMap) -> [u32; 5] {
|
2023-04-14 08:34:41 +00:00
|
|
|
let kind = match self.kind {
|
|
|
|
tt::DelimiterKind::Invisible => 0,
|
|
|
|
tt::DelimiterKind::Parenthesis => 1,
|
|
|
|
tt::DelimiterKind::Brace => 2,
|
|
|
|
tt::DelimiterKind::Bracket => 3,
|
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
[
|
|
|
|
map.serialize_span(self.open),
|
|
|
|
map.serialize_span(self.close),
|
|
|
|
kind,
|
|
|
|
self.tt[0],
|
|
|
|
self.tt[1],
|
|
|
|
]
|
2023-04-14 08:34:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read_with_close_span([open, close, kind, lo, len]: [u32; 5], map: &SpanMap) -> Self {
|
2023-04-14 08:34:41 +00:00
|
|
|
let kind = match kind {
|
|
|
|
0 => tt::DelimiterKind::Invisible,
|
|
|
|
1 => tt::DelimiterKind::Parenthesis,
|
|
|
|
2 => tt::DelimiterKind::Brace,
|
|
|
|
3 => tt::DelimiterKind::Bracket,
|
|
|
|
other => panic!("bad kind {other}"),
|
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
SubtreeRepr {
|
|
|
|
open: map.deserialize_span(open),
|
|
|
|
close: map.deserialize_span(close),
|
|
|
|
kind,
|
|
|
|
tt: [lo, len],
|
|
|
|
}
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<const L: usize, S: SerializableSpan<L>> LiteralRepr<L, S> {
|
|
|
|
fn write(self, map: &mut SpanMap) -> [u32; 2] {
|
|
|
|
[map.serialize_span(self.id), self.text]
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read([id, text]: [u32; 2], map: &SpanMap) -> Self {
|
|
|
|
LiteralRepr { id: map.deserialize_span(id), text }
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<const L: usize, S: SerializableSpan<L>> PunctRepr<L, S> {
|
|
|
|
fn write(self, map: &mut SpanMap) -> [u32; 3] {
|
2021-08-28 17:36:41 +00:00
|
|
|
let spacing = match self.spacing {
|
|
|
|
tt::Spacing::Alone => 0,
|
|
|
|
tt::Spacing::Joint => 1,
|
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
[map.serialize_span(self.id), self.char as u32, spacing]
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read([id, char, spacing]: [u32; 3], map: &SpanMap) -> Self {
|
2021-08-28 17:36:41 +00:00
|
|
|
let spacing = match spacing {
|
|
|
|
0 => tt::Spacing::Alone,
|
|
|
|
1 => tt::Spacing::Joint,
|
2022-12-23 18:42:58 +00:00
|
|
|
other => panic!("bad spacing {other}"),
|
2021-08-28 17:36:41 +00:00
|
|
|
};
|
2023-06-29 10:23:45 +00:00
|
|
|
PunctRepr { id: map.deserialize_span(id), char: char.try_into().unwrap(), spacing }
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<const L: usize, S: SerializableSpan<L>> IdentRepr<L, S> {
|
|
|
|
fn write(self, map: &mut SpanMap) -> [u32; 2] {
|
|
|
|
[map.serialize_span(self.id), self.text]
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
2023-06-29 10:23:45 +00:00
|
|
|
fn read(data: [u32; 2], map: &SpanMap) -> Self {
|
|
|
|
IdentRepr { id: map.deserialize_span(data[0]), text: data[1] }
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
struct Writer<'a, const L: usize, S> {
|
|
|
|
work: VecDeque<(usize, &'a tt::Subtree<S>)>,
|
2021-08-28 17:36:41 +00:00
|
|
|
string_table: HashMap<&'a str, u32>,
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
subtree: Vec<SubtreeRepr<L, S>>,
|
|
|
|
literal: Vec<LiteralRepr<L, S>>,
|
|
|
|
punct: Vec<PunctRepr<L, S>>,
|
|
|
|
ident: Vec<IdentRepr<L, S>>,
|
2021-08-28 17:36:41 +00:00
|
|
|
token_tree: Vec<u32>,
|
|
|
|
text: Vec<String>,
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<'a, const L: usize, S: Copy> Writer<'a, L, S> {
|
|
|
|
fn write(&mut self, root: &'a tt::Subtree<S>) {
|
2021-08-28 17:36:41 +00:00
|
|
|
self.enqueue(root);
|
|
|
|
while let Some((idx, subtree)) = self.work.pop_front() {
|
|
|
|
self.subtree(idx, subtree);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
fn subtree(&mut self, idx: usize, subtree: &'a tt::Subtree<S>) {
|
2021-08-28 17:36:41 +00:00
|
|
|
let mut first_tt = self.token_tree.len();
|
|
|
|
let n_tt = subtree.token_trees.len();
|
|
|
|
self.token_tree.resize(first_tt + n_tt, !0);
|
|
|
|
|
|
|
|
self.subtree[idx].tt = [first_tt as u32, (first_tt + n_tt) as u32];
|
|
|
|
|
|
|
|
for child in &subtree.token_trees {
|
|
|
|
let idx_tag = match child {
|
|
|
|
tt::TokenTree::Subtree(it) => {
|
|
|
|
let idx = self.enqueue(it);
|
2022-12-30 10:02:45 +00:00
|
|
|
idx << 2
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
tt::TokenTree::Leaf(leaf) => match leaf {
|
|
|
|
tt::Leaf::Literal(lit) => {
|
|
|
|
let idx = self.literal.len() as u32;
|
|
|
|
let text = self.intern(&lit.text);
|
2023-01-31 10:49:49 +00:00
|
|
|
self.literal.push(LiteralRepr { id: lit.span, text });
|
2021-08-28 17:36:41 +00:00
|
|
|
idx << 2 | 0b01
|
|
|
|
}
|
|
|
|
tt::Leaf::Punct(punct) => {
|
|
|
|
let idx = self.punct.len() as u32;
|
|
|
|
self.punct.push(PunctRepr {
|
|
|
|
char: punct.char,
|
|
|
|
spacing: punct.spacing,
|
2023-01-31 10:49:49 +00:00
|
|
|
id: punct.span,
|
2021-08-28 17:36:41 +00:00
|
|
|
});
|
|
|
|
idx << 2 | 0b10
|
|
|
|
}
|
|
|
|
tt::Leaf::Ident(ident) => {
|
|
|
|
let idx = self.ident.len() as u32;
|
|
|
|
let text = self.intern(&ident.text);
|
2023-01-31 10:49:49 +00:00
|
|
|
self.ident.push(IdentRepr { id: ident.span, text });
|
2021-08-28 17:36:41 +00:00
|
|
|
idx << 2 | 0b11
|
|
|
|
}
|
|
|
|
},
|
|
|
|
};
|
|
|
|
self.token_tree[first_tt] = idx_tag;
|
|
|
|
first_tt += 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
fn enqueue(&mut self, subtree: &'a tt::Subtree<S>) -> u32 {
|
2021-08-28 17:36:41 +00:00
|
|
|
let idx = self.subtree.len();
|
2023-04-14 08:34:41 +00:00
|
|
|
let open = subtree.delimiter.open;
|
|
|
|
let close = subtree.delimiter.close;
|
2023-01-31 10:49:49 +00:00
|
|
|
let delimiter_kind = subtree.delimiter.kind;
|
2023-04-14 08:34:41 +00:00
|
|
|
self.subtree.push(SubtreeRepr { open, close, kind: delimiter_kind, tt: [!0, !0] });
|
2021-08-28 17:36:41 +00:00
|
|
|
self.work.push_back((idx, subtree));
|
|
|
|
idx as u32
|
|
|
|
}
|
|
|
|
|
|
|
|
pub(crate) fn intern(&mut self, text: &'a str) -> u32 {
|
|
|
|
let table = &mut self.text;
|
|
|
|
*self.string_table.entry(text).or_insert_with(|| {
|
|
|
|
let idx = table.len();
|
|
|
|
table.push(text.to_string());
|
|
|
|
idx as u32
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
struct Reader<const L: usize, S> {
|
|
|
|
subtree: Vec<SubtreeRepr<L, S>>,
|
|
|
|
literal: Vec<LiteralRepr<L, S>>,
|
|
|
|
punct: Vec<PunctRepr<L, S>>,
|
|
|
|
ident: Vec<IdentRepr<L, S>>,
|
2021-08-28 17:36:41 +00:00
|
|
|
token_tree: Vec<u32>,
|
|
|
|
text: Vec<String>,
|
|
|
|
}
|
|
|
|
|
2023-06-29 10:23:45 +00:00
|
|
|
impl<const L: usize, S: SerializableSpan<L>> Reader<L, S> {
|
|
|
|
pub(crate) fn read(self) -> tt::Subtree<S> {
|
|
|
|
let mut res: Vec<Option<tt::Subtree<S>>> = vec![None; self.subtree.len()];
|
2021-08-28 17:36:41 +00:00
|
|
|
for i in (0..self.subtree.len()).rev() {
|
|
|
|
let repr = &self.subtree[i];
|
|
|
|
let token_trees = &self.token_tree[repr.tt[0] as usize..repr.tt[1] as usize];
|
|
|
|
let s = tt::Subtree {
|
2023-04-14 08:34:41 +00:00
|
|
|
delimiter: tt::Delimiter { open: repr.open, close: repr.close, kind: repr.kind },
|
2021-08-28 17:36:41 +00:00
|
|
|
token_trees: token_trees
|
|
|
|
.iter()
|
|
|
|
.copied()
|
|
|
|
.map(|idx_tag| {
|
|
|
|
let tag = idx_tag & 0b11;
|
|
|
|
let idx = (idx_tag >> 2) as usize;
|
|
|
|
match tag {
|
|
|
|
// XXX: we iterate subtrees in reverse to guarantee
|
|
|
|
// that this unwrap doesn't fire.
|
|
|
|
0b00 => res[idx].take().unwrap().into(),
|
|
|
|
0b01 => {
|
|
|
|
let repr = &self.literal[idx];
|
|
|
|
tt::Leaf::Literal(tt::Literal {
|
|
|
|
text: self.text[repr.text as usize].as_str().into(),
|
2023-01-31 10:49:49 +00:00
|
|
|
span: repr.id,
|
2021-08-28 17:36:41 +00:00
|
|
|
})
|
|
|
|
.into()
|
|
|
|
}
|
|
|
|
0b10 => {
|
|
|
|
let repr = &self.punct[idx];
|
|
|
|
tt::Leaf::Punct(tt::Punct {
|
|
|
|
char: repr.char,
|
|
|
|
spacing: repr.spacing,
|
2023-01-31 10:49:49 +00:00
|
|
|
span: repr.id,
|
2021-08-28 17:36:41 +00:00
|
|
|
})
|
|
|
|
.into()
|
|
|
|
}
|
|
|
|
0b11 => {
|
|
|
|
let repr = &self.ident[idx];
|
|
|
|
tt::Leaf::Ident(tt::Ident {
|
|
|
|
text: self.text[repr.text as usize].as_str().into(),
|
2023-01-31 10:49:49 +00:00
|
|
|
span: repr.id,
|
2021-08-28 17:36:41 +00:00
|
|
|
})
|
|
|
|
.into()
|
|
|
|
}
|
2022-12-23 18:42:58 +00:00
|
|
|
other => panic!("bad tag: {other}"),
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
})
|
|
|
|
.collect(),
|
|
|
|
};
|
2021-10-03 12:39:43 +00:00
|
|
|
res[i] = Some(s);
|
2021-08-28 17:36:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
res[0].take().unwrap()
|
|
|
|
}
|
|
|
|
}
|