Merge remote-tracking branch 'origin/master'

author: Dmitry <[email protected]> 2020-08-14 19:32:05 +0100
committer: Dmitry <[email protected]> 2020-08-14 19:32:05 +0100
commit: 178c3e135a2a249692f7784712492e7884ae0c00 (patch)
tree: ac6b769dbf7162150caa0c1624786a4dd79ff3be /crates/syntax/src/parsing/text_token_source.rs
parent: 06ff8e6c760ff05f10e868b5d1f9d79e42fbb49c (diff)
parent: c2594daf2974dbd4ce3d9b7ec72481764abaceb5 (diff)
1 files changed, 84 insertions, 0 deletions
diff --git a/crates/syntax/src/parsing/text_token_source.rs b/crates/syntax/src/parsing/text_token_source.rs
new file mode 100644
index 000000000..df866dc2b
--- /dev/null
+++ b/crates/syntax/src/parsing/text_token_source.rs
@@ -0,0 +1,84 @@
+//! See `TextTokenSource` docs.
+use parser::TokenSource;
+use crate::{parsing::lexer::Token, SyntaxKind::EOF, TextRange, TextSize};
+/// Implementation of `parser::TokenSource` that takes tokens from source code text.
+pub(crate) struct TextTokenSource<'t> {
+    text: &'t str, // source text; `is_keyword` slices it to read the current token's text
+    /// Non-trivia tokens with their start offsets (skipped trivia still advances the offset)
+    /// ```non-rust
+    ///  struct Foo;
+    ///  ^------^--^-
+    ///  |      |    \________
+    ///  |      \____         \
+    ///  |           \         |
+    ///  (struct, 0) (Foo, 7) (;, 10)
+    /// ```
+    /// `[(struct, 0), (Foo, 7), (;, 10)]`
+    token_offset_pairs: Vec<(Token, TextSize)>,
+    /// Current parser token and its index into `token_offset_pairs`
+    curr: (parser::Token, usize),
+}
+impl<'t> TokenSource for TextTokenSource<'t> {
+    fn current(&self) -> parser::Token { // the token cached in `curr`
+        self.curr.0
+    }
+    fn lookahead_nth(&self, n: usize) -> parser::Token { // token `n` entries past the current index
+        mk_token(self.curr.1 + n, &self.token_offset_pairs)
+    }
+    fn bump(&mut self) { // advance `curr` by one entry
+        if self.curr.0.kind == EOF {
+            return; // already at EOF: index and token are left unchanged
+        }
+        let pos = self.curr.1 + 1;
+        self.curr = (mk_token(pos, &self.token_offset_pairs), pos);
+    }
+    fn is_keyword(&self, kw: &str) -> bool { // true when the current token's source text equals `kw`
+        self.token_offset_pairs
+            .get(self.curr.1)
+            .map(|(token, offset)| &self.text[TextRange::at(*offset, token.len)] == kw)
+            .unwrap_or(false) // no entry at the current index: never a keyword
+    }
+}
+fn mk_token(pos: usize, token_offset_pairs: &[(Token, TextSize)]) -> parser::Token { // parser token for index `pos`
+    let (kind, is_jointed_to_next) = match token_offset_pairs.get(pos) {
+        Some((token, offset)) => (
+            token.kind,
+            token_offset_pairs
+                .get(pos + 1)
+                .map(|(_, next_offset)| offset + token.len == *next_offset) // joint: next entry starts exactly where this one ends
+                .unwrap_or(false), // last entry has no successor, so it is not joint
+        ),
+        None => (EOF, false), // index past the end is reported as EOF
+    };
+    parser::Token { kind, is_jointed_to_next }
+}
+impl<'t> TextTokenSource<'t> {
+    /// Generate input from tokens (except comment and whitespace), pairing each kept token with its start offset.
+    pub fn new(text: &'t str, raw_tokens: &'t [Token]) -> TextTokenSource<'t> {
+        let token_offset_pairs: Vec<_> = raw_tokens
+            .iter()
+            .filter_map({
+                let mut len = 0.into(); // running start offset of the token being visited
+                move |token| {
+                    let pair = if token.kind.is_trivia() { None } else { Some((*token, len)) };
+                    len += token.len; // advanced for every token, trivia included
+                    pair
+                }
+            })
+            .collect();
+        let first = mk_token(0, &token_offset_pairs); // EOF when no non-trivia token exists
+        TextTokenSource { text, token_offset_pairs, curr: (first, 0) }
+    }
+}
author	Dmitry <[email protected]>	2020-08-14 19:32:05 +0100
committer	Dmitry <[email protected]>	2020-08-14 19:32:05 +0100
commit	178c3e135a2a249692f7784712492e7884ae0c00 (patch)
tree	ac6b769dbf7162150caa0c1624786a4dd79ff3be /crates/syntax/src/parsing/text_token_source.rs
parent	06ff8e6c760ff05f10e868b5d1f9d79e42fbb49c (diff)
parent	c2594daf2974dbd4ce3d9b7ec72481764abaceb5 (diff)

diff --git a/crates/syntax/src/parsing/text_token_source.rs b/crates/syntax/src/parsing/text_token_source.rs new file mode 100644 index 000000000..df866dc2b --- /dev/null +++ b/crates/syntax/src/parsing/text_token_source.rs
@@ -0,0 +1,84 @@
	1	//! See `TextTokenSource` docs.
	2
	3	use parser::TokenSource;
	4
	5	use crate::{parsing::lexer::Token, SyntaxKind::EOF, TextRange, TextSize};
	6
	7	/// Implementation of `parser::TokenSource` that takes tokens from source code text.
	8	pub(crate) struct TextTokenSource<'t> {
	9	text: &'t str,
	10	/// token and its start position (non-whitespace/comment tokens)
	11	/// ```non-rust
	12	/// struct Foo;
	13	/// ^------^--^-
	14	/// |      |    \________
	15	/// |      \____         \
	16	/// |           \         |
	17	/// (struct, 0) (Foo, 7) (;, 10)
	18	/// ```
	19	/// `[(struct, 0), (Foo, 7), (;, 10)]`
	20	token_offset_pairs: Vec<(Token, TextSize)>,
	21
	22	/// Current token and position
	23	curr: (parser::Token, usize),
	24	}
	25
	26	impl<'t> TokenSource for TextTokenSource<'t> {
	27	fn current(&self) -> parser::Token {
	28	self.curr.0
	29	}
	30
	31	fn lookahead_nth(&self, n: usize) -> parser::Token {
	32	mk_token(self.curr.1 + n, &self.token_offset_pairs)
	33	}
	34
	35	fn bump(&mut self) {
	36	if self.curr.0.kind == EOF {
	37	return;
	38	}
	39
	40	let pos = self.curr.1 + 1;
	41	self.curr = (mk_token(pos, &self.token_offset_pairs), pos);
	42	}
	43
	44	fn is_keyword(&self, kw: &str) -> bool {
	45	self.token_offset_pairs
	46	.get(self.curr.1)
	47	.map(|(token, offset)| &self.text[TextRange::at(*offset, token.len)] == kw)
	48	.unwrap_or(false)
	49	}
	50	}
	51
	52	fn mk_token(pos: usize, token_offset_pairs: &[(Token, TextSize)]) -> parser::Token {
	53	let (kind, is_jointed_to_next) = match token_offset_pairs.get(pos) {
	54	Some((token, offset)) => (
	55	token.kind,
	56	token_offset_pairs
	57	.get(pos + 1)
	58	.map(|(_, next_offset)| offset + token.len == *next_offset)
	59	.unwrap_or(false),
	60	),
	61	None => (EOF, false),
	62	};
	63	parser::Token { kind, is_jointed_to_next }
	64	}
	65
	66	impl<'t> TextTokenSource<'t> {
	67	/// Generate input from tokens (except comment and whitespace).
	68	pub fn new(text: &'t str, raw_tokens: &'t [Token]) -> TextTokenSource<'t> {
	69	let token_offset_pairs: Vec<_> = raw_tokens
	70	.iter()
	71	.filter_map({
	72	let mut len = 0.into();
	73	move |token| {
	74	let pair = if token.kind.is_trivia() { None } else { Some((*token, len)) };
	75	len += token.len;
	76	pair
	77	}
	78	})
	79	.collect();
	80
	81	let first = mk_token(0, &token_offset_pairs);
	82	TextTokenSource { text, token_offset_pairs, curr: (first, 0) }
	83	}
	84	}