difftreelog
refactor use grammar to classify tokens
in: master
13 files changed
cmds/jrsonnet-fmt/src/main.rsdiffbeforeafterboth--- a/cmds/jrsonnet-fmt/src/main.rs
+++ b/cmds/jrsonnet-fmt/src/main.rs
@@ -5,7 +5,7 @@
nodes::{
ArgsDesc, Assertion, BinaryOperator, Bind, CompSpec, Destruct, DestructArrayPart,
DestructRest, Expr, Field, FieldName, ForSpec, IfSpec, ImportKind, LhsExpr, Literal,
- Member, Name, Number, ObjBody, ObjLocal, ParamsDesc, SliceDesc, SourceFile, String,
+ Member, Name, Number, ObjBody, ObjLocal, ParamsDesc, SliceDesc, SourceFile, Text,
UnaryOperator,
},
AstToken, SyntaxToken,
@@ -91,7 +91,7 @@
}
}
-impl Printable for String {
+impl Printable for Text {
fn print(&self) -> PrintItems {
p!(new: str(&format!("{}", self)))
}
@@ -168,7 +168,7 @@
FieldName::FieldNameFixed(f) => {
if let Some(id) = f.id() {
p!(new: {id})
- } else if let Some(str) = f.string() {
+ } else if let Some(str) = f.text() {
p!(new: {str})
} else {
p!(new: str("/*missing FieldName*/"))
@@ -371,7 +371,7 @@
Expr::ExprIntrinsicThisFile(_) => p!(new: str("$intrinsicThisFile")),
Expr::ExprIntrinsicId(_) => p!(new: str("$intrinsicId")),
Expr::ExprIntrinsic(i) => p!(new: str("$intrinsic(") {i.name()} str(")")),
- Expr::ExprString(s) => p!(new: {s.string()}),
+ Expr::ExprString(s) => p!(new: {s.text()}),
Expr::ExprNumber(n) => p!(new: {n.number()}),
Expr::ExprArray(a) => {
let mut pi = p!(new: str("[") >i nl);
@@ -393,7 +393,7 @@
pi
}
Expr::ExprImport(v) => {
- p!(new: {v.import_kind()} str(" ") {v.string()})
+ p!(new: {v.import_kind()} str(" ") {v.text()})
}
Expr::ExprVar(n) => p!(new: {n.name()}),
Expr::ExprLocal(l) => {
crates/jrsonnet-rowan-parser/jsonnet.ungramdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/jsonnet.ungram
+++ b/crates/jrsonnet-rowan-parser/jsonnet.ungram
@@ -48,7 +48,7 @@
name:Name
')'
ExprString =
- String
+ Text
ExprNumber =
Number
ExprArray =
@@ -67,7 +67,7 @@
']'
ExprImport =
- ImportKind String
+ ImportKind Text
ImportKind =
'importstr'
@@ -217,7 +217,7 @@
FieldNameFixed =
id:Name
-| String
+| Text
FieldNameDynamic =
'['
Expr
@@ -239,16 +239,27 @@
| '$'
| 'super'
-String =
+Text =
'LIT_STRING_DOUBLE!'
+| 'ERROR_STRING_DOUBLE_UNTERMINATED!'
| 'LIT_STRING_SINGLE!'
+| 'ERROR_STRING_SINGLE_UNTERMINATED!'
| 'LIT_STRING_DOUBLE_VERBATIM!'
+| 'ERROR_STRING_DOUBLE_VERBATIM_UNTERMINATED!'
| 'LIT_STRING_SINGLE_VERBATIM!'
+| 'ERROR_STRING_SINGLE_VERBATIM_UNTERMINATED!'
+| 'ERROR_STRING_VERBATIM_MISSING_QUOTES!'
| 'LIT_STRING_BLOCK!'
+| 'ERROR_STRING_BLOCK_UNEXPECTED_END!'
+| 'ERROR_STRING_BLOCK_MISSING_NEW_LINE!'
+| 'ERROR_STRING_BLOCK_MISSING_TERMINATION!'
+| 'ERROR_STRING_BLOCK_MISSING_INDENT!'
Number =
'LIT_FLOAT!'
-| 'META_FORCE_ENUM!'
+| 'ERROR_FLOAT_JUNK_AFTER_POINT!'
+| 'ERROR_FLOAT_JUNK_AFTER_EXPONENT!'
+| 'ERROR_FLOAT_JUNK_AFTER_EXPONENT_SIGN!'
ForSpec =
'for'
@@ -347,3 +358,12 @@
TrueExpr=Expr
FalseExpr=Expr
LhsExpr=Expr
+
+// Trivia - tokens which are implicitly skipped by the parser
+Trivia =
+ 'LIT_WHITESPACE!'
+| 'LIT_MULTI_LINE_COMMENT!'
+| 'ERROR_COMMENT_TOO_SHORT!'
+| 'ERROR_COMMENT_UNTERMINATED!'
+| 'LIT_SINGLE_LINE_HASH_COMMENT!'
+| 'LIT_SINGLE_LINE_SLASH_COMMENT!'
crates/jrsonnet-rowan-parser/src/classify.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/classify.rs
+++ /dev/null
@@ -1,51 +0,0 @@
-use crate::SyntaxKind;
-
-impl SyntaxKind {
- pub fn is_trivia(self) -> bool {
- matches!(
- self,
- Self::WHITESPACE
- | Self::MULTI_LINE_COMMENT
- | Self::ERROR_COMMENT_TOO_SHORT
- | Self::ERROR_COMMENT_UNTERMINATED
- | Self::SINGLE_LINE_HASH_COMMENT
- | Self::SINGLE_LINE_SLASH_COMMENT
- )
- }
- pub fn is_string(self) -> bool {
- matches!(
- self,
- Self::STRING_SINGLE
- | Self::ERROR_STRING_SINGLE_UNTERMINATED
- | Self::STRING_DOUBLE
- | Self::ERROR_STRING_DOUBLE_UNTERMINATED
- | Self::STRING_SINGLE_VERBATIM
- | Self::ERROR_STRING_SINGLE_VERBATIM_UNTERMINATED
- | Self::STRING_DOUBLE_VERBATIM
- | Self::ERROR_STRING_DOUBLE_VERBATIM_UNTERMINATED
- | Self::STRING_BLOCK
- | Self::ERROR_STRING_BLOCK_UNEXPECTED_END
- | Self::ERROR_STRING_BLOCK_MISSING_NEW_LINE
- | Self::ERROR_STRING_BLOCK_MISSING_TERMINATION
- | Self::ERROR_STRING_BLOCK_MISSING_INDENT
- )
- }
- pub fn is_number(self) -> bool {
- matches!(
- self,
- Self::FLOAT
- | Self::ERROR_FLOAT_JUNK_AFTER_POINT
- | Self::ERROR_FLOAT_JUNK_AFTER_EXPONENT
- | Self::ERROR_FLOAT_JUNK_AFTER_EXPONENT_SIGN
- )
- }
- pub fn is_literal(self) -> bool {
- matches!(
- self,
- Self::NULL_KW
- | Self::TRUE_KW | Self::FALSE_KW
- | Self::SELF_KW | Self::DOLLAR
- | Self::SUPER_KW
- )
- }
-}
crates/jrsonnet-rowan-parser/src/event.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/event.rs
+++ b/crates/jrsonnet-rowan-parser/src/event.rs
@@ -4,8 +4,9 @@
use crate::{
lex::Lexeme,
+ nodes::Trivia,
parser::{Parse, SyntaxError},
- JsonnetLanguage, SyntaxKind,
+ AstToken, JsonnetLanguage, SyntaxKind,
};
#[derive(Clone, Debug, PartialEq, Eq)]
@@ -144,7 +145,7 @@
}
fn skip_whitespace(&mut self) {
while let Some(lexeme) = self.lexemes.get(self.offset) {
- if !lexeme.kind.is_trivia() {
+ if !Trivia::can_cast(lexeme.kind) {
break;
}
crates/jrsonnet-rowan-parser/src/generated/nodes.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/generated/nodes.rs
+++ b/crates/jrsonnet-rowan-parser/src/generated/nodes.rs
@@ -255,7 +255,7 @@
pub(crate) syntax: SyntaxNode,
}
impl ExprString {
- pub fn string(&self) -> Option<String> {
+ pub fn text(&self) -> Option<Text> {
support::token_child(&self.syntax)
}
}
@@ -332,7 +332,7 @@
pub fn import_kind(&self) -> Option<ImportKind> {
support::token_child(&self.syntax)
}
- pub fn string(&self) -> Option<String> {
+ pub fn text(&self) -> Option<Text> {
support::token_child(&self.syntax)
}
}
@@ -692,7 +692,7 @@
pub fn id(&self) -> Option<Name> {
support::child(&self.syntax)
}
- pub fn string(&self) -> Option<String> {
+ pub fn text(&self) -> Option<Text> {
support::token_child(&self.syntax)
}
}
@@ -1038,18 +1038,27 @@
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
-pub struct String {
+pub struct Text {
syntax: SyntaxToken,
- kind: StringKind,
+ kind: TextKind,
}
#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
-pub enum StringKind {
+pub enum TextKind {
StringDouble,
+ ErrorStringDoubleUnterminated,
StringSingle,
+ ErrorStringSingleUnterminated,
StringDoubleVerbatim,
+ ErrorStringDoubleVerbatimUnterminated,
StringSingleVerbatim,
+ ErrorStringSingleVerbatimUnterminated,
+ ErrorStringVerbatimMissingQuotes,
StringBlock,
+ ErrorStringBlockUnexpectedEnd,
+ ErrorStringBlockMissingNewLine,
+ ErrorStringBlockMissingTermination,
+ ErrorStringBlockMissingIndent,
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
@@ -1061,7 +1070,9 @@
#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
pub enum NumberKind {
Float,
- MetaForceEnum,
+ ErrorFloatJunkAfterPoint,
+ ErrorFloatJunkAfterExponent,
+ ErrorFloatJunkAfterExponentSign,
}
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
@@ -1089,6 +1100,22 @@
Coloncolon,
Colon,
}
+
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct Trivia {
+ syntax: SyntaxToken,
+ kind: TriviaKind,
+}
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum TriviaKind {
+ Whitespace,
+ MultiLineComment,
+ ErrorCommentTooShort,
+ ErrorCommentUnterminated,
+ SingleLineHashComment,
+ SingleLineSlashComment,
+}
impl AstNode for SourceFile {
fn can_cast(kind: SyntaxKind) -> bool {
kind == SOURCE_FILE
@@ -2677,39 +2704,84 @@
std::fmt::Display::fmt(self.syntax(), f)
}
}
-impl AstToken for String {
+impl AstToken for Text {
fn can_cast(kind: SyntaxKind) -> bool {
match kind {
STRING_DOUBLE
+ | ERROR_STRING_DOUBLE_UNTERMINATED
| STRING_SINGLE
+ | ERROR_STRING_SINGLE_UNTERMINATED
| STRING_DOUBLE_VERBATIM
+ | ERROR_STRING_DOUBLE_VERBATIM_UNTERMINATED
| STRING_SINGLE_VERBATIM
- | STRING_BLOCK => true,
+ | ERROR_STRING_SINGLE_VERBATIM_UNTERMINATED
+ | ERROR_STRING_VERBATIM_MISSING_QUOTES
+ | STRING_BLOCK
+ | ERROR_STRING_BLOCK_UNEXPECTED_END
+ | ERROR_STRING_BLOCK_MISSING_NEW_LINE
+ | ERROR_STRING_BLOCK_MISSING_TERMINATION
+ | ERROR_STRING_BLOCK_MISSING_INDENT => true,
_ => false,
}
}
fn cast(syntax: SyntaxToken) -> Option<Self> {
let res = match syntax.kind() {
- STRING_DOUBLE => String {
+ STRING_DOUBLE => Text {
syntax,
- kind: StringKind::StringDouble,
+ kind: TextKind::StringDouble,
},
- STRING_SINGLE => String {
+ ERROR_STRING_DOUBLE_UNTERMINATED => Text {
syntax,
- kind: StringKind::StringSingle,
+ kind: TextKind::ErrorStringDoubleUnterminated,
},
- STRING_DOUBLE_VERBATIM => String {
+ STRING_SINGLE => Text {
syntax,
- kind: StringKind::StringDoubleVerbatim,
+ kind: TextKind::StringSingle,
},
- STRING_SINGLE_VERBATIM => String {
+ ERROR_STRING_SINGLE_UNTERMINATED => Text {
syntax,
- kind: StringKind::StringSingleVerbatim,
+ kind: TextKind::ErrorStringSingleUnterminated,
},
- STRING_BLOCK => String {
+ STRING_DOUBLE_VERBATIM => Text {
syntax,
- kind: StringKind::StringBlock,
+ kind: TextKind::StringDoubleVerbatim,
+ },
+ ERROR_STRING_DOUBLE_VERBATIM_UNTERMINATED => Text {
+ syntax,
+ kind: TextKind::ErrorStringDoubleVerbatimUnterminated,
+ },
+ STRING_SINGLE_VERBATIM => Text {
+ syntax,
+ kind: TextKind::StringSingleVerbatim,
},
+ ERROR_STRING_SINGLE_VERBATIM_UNTERMINATED => Text {
+ syntax,
+ kind: TextKind::ErrorStringSingleVerbatimUnterminated,
+ },
+ ERROR_STRING_VERBATIM_MISSING_QUOTES => Text {
+ syntax,
+ kind: TextKind::ErrorStringVerbatimMissingQuotes,
+ },
+ STRING_BLOCK => Text {
+ syntax,
+ kind: TextKind::StringBlock,
+ },
+ ERROR_STRING_BLOCK_UNEXPECTED_END => Text {
+ syntax,
+ kind: TextKind::ErrorStringBlockUnexpectedEnd,
+ },
+ ERROR_STRING_BLOCK_MISSING_NEW_LINE => Text {
+ syntax,
+ kind: TextKind::ErrorStringBlockMissingNewLine,
+ },
+ ERROR_STRING_BLOCK_MISSING_TERMINATION => Text {
+ syntax,
+ kind: TextKind::ErrorStringBlockMissingTermination,
+ },
+ ERROR_STRING_BLOCK_MISSING_INDENT => Text {
+ syntax,
+ kind: TextKind::ErrorStringBlockMissingIndent,
+ },
_ => return None,
};
Some(res)
@@ -2718,12 +2790,12 @@
&self.syntax
}
}
-impl String {
- pub fn kind(&self) -> StringKind {
+impl Text {
+ pub fn kind(&self) -> TextKind {
self.kind
}
}
-impl std::fmt::Display for String {
+impl std::fmt::Display for Text {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
std::fmt::Display::fmt(self.syntax(), f)
}
@@ -2731,7 +2803,10 @@
impl AstToken for Number {
fn can_cast(kind: SyntaxKind) -> bool {
match kind {
- FLOAT | META_FORCE_ENUM => true,
+ FLOAT
+ | ERROR_FLOAT_JUNK_AFTER_POINT
+ | ERROR_FLOAT_JUNK_AFTER_EXPONENT
+ | ERROR_FLOAT_JUNK_AFTER_EXPONENT_SIGN => true,
_ => false,
}
}
@@ -2741,10 +2816,18 @@
syntax,
kind: NumberKind::Float,
},
- META_FORCE_ENUM => Number {
+ ERROR_FLOAT_JUNK_AFTER_POINT => Number {
+ syntax,
+ kind: NumberKind::ErrorFloatJunkAfterPoint,
+ },
+ ERROR_FLOAT_JUNK_AFTER_EXPONENT => Number {
syntax,
- kind: NumberKind::MetaForceEnum,
+ kind: NumberKind::ErrorFloatJunkAfterExponent,
},
+ ERROR_FLOAT_JUNK_AFTER_EXPONENT_SIGN => Number {
+ syntax,
+ kind: NumberKind::ErrorFloatJunkAfterExponentSign,
+ },
_ => return None,
};
Some(res)
@@ -2841,6 +2924,62 @@
std::fmt::Display::fmt(self.syntax(), f)
}
}
+impl AstToken for Trivia {
+ fn can_cast(kind: SyntaxKind) -> bool {
+ match kind {
+ WHITESPACE
+ | MULTI_LINE_COMMENT
+ | ERROR_COMMENT_TOO_SHORT
+ | ERROR_COMMENT_UNTERMINATED
+ | SINGLE_LINE_HASH_COMMENT
+ | SINGLE_LINE_SLASH_COMMENT => true,
+ _ => false,
+ }
+ }
+ fn cast(syntax: SyntaxToken) -> Option<Self> {
+ let res = match syntax.kind() {
+ WHITESPACE => Trivia {
+ syntax,
+ kind: TriviaKind::Whitespace,
+ },
+ MULTI_LINE_COMMENT => Trivia {
+ syntax,
+ kind: TriviaKind::MultiLineComment,
+ },
+ ERROR_COMMENT_TOO_SHORT => Trivia {
+ syntax,
+ kind: TriviaKind::ErrorCommentTooShort,
+ },
+ ERROR_COMMENT_UNTERMINATED => Trivia {
+ syntax,
+ kind: TriviaKind::ErrorCommentUnterminated,
+ },
+ SINGLE_LINE_HASH_COMMENT => Trivia {
+ syntax,
+ kind: TriviaKind::SingleLineHashComment,
+ },
+ SINGLE_LINE_SLASH_COMMENT => Trivia {
+ syntax,
+ kind: TriviaKind::SingleLineSlashComment,
+ },
+ _ => return None,
+ };
+ Some(res)
+ }
+ fn syntax(&self) -> &SyntaxToken {
+ &self.syntax
+ }
+}
+impl Trivia {
+ pub fn kind(&self) -> TriviaKind {
+ self.kind
+ }
+}
+impl std::fmt::Display for Trivia {
+ fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+ std::fmt::Display::fmt(self.syntax(), f)
+ }
+}
impl std::fmt::Display for Expr {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
std::fmt::Display::fmt(self.syntax(), f)
crates/jrsonnet-rowan-parser/src/generated/syntax_kinds.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/generated/syntax_kinds.rs
+++ b/crates/jrsonnet-rowan-parser/src/generated/syntax_kinds.rs
@@ -174,7 +174,6 @@
SELF_KW,
#[token("super")]
SUPER_KW,
- META_FORCE_ENUM,
#[token("for")]
FOR_KW,
#[token("assert")]
@@ -253,10 +252,11 @@
BINARY_OPERATOR,
UNARY_OPERATOR,
LITERAL,
- STRING,
+ TEXT,
NUMBER,
IMPORT_KIND,
VISIBILITY,
+ TRIVIA,
#[doc(hidden)]
__LAST,
}
@@ -277,8 +277,8 @@
pub fn is_enum(self) -> bool {
match self {
EXPR | OBJ_BODY | COMP_SPEC | BIND | MEMBER | FIELD | FIELD_NAME | DESTRUCT
- | DESTRUCT_ARRAY_PART | BINARY_OPERATOR | UNARY_OPERATOR | LITERAL | STRING
- | NUMBER | IMPORT_KIND | VISIBILITY => true,
+ | DESTRUCT_ARRAY_PART | BINARY_OPERATOR | UNARY_OPERATOR | LITERAL | TEXT | NUMBER
+ | IMPORT_KIND | VISIBILITY | TRIVIA => true,
_ => false,
}
}
crates/jrsonnet-rowan-parser/src/lex.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/lex.rs
+++ b/crates/jrsonnet-rowan-parser/src/lex.rs
@@ -4,7 +4,10 @@
use logos::Logos;
use rowan::{TextRange, TextSize};
-use crate::SyntaxKind;
+use crate::{
+ string_block::{lex_str_block, StringBlockError},
+ SyntaxKind,
+};
pub struct Lexer<'a> {
inner: logos::Lexer<'a, SyntaxKind>,
@@ -22,9 +25,34 @@
type Item = Lexeme<'a>;
fn next(&mut self) -> Option<Self::Item> {
- let kind = self.inner.next()?;
+ use SyntaxKind::*;
+
+ let mut kind = self.inner.next()?;
let text = self.inner.slice();
+ if kind == STRING_BLOCK {
+ // We use a custom lexer, which skips enough bytes but does not return an error.
+ // Instead, we call the lexer again to verify whether something is wrong with the string block.
+ let mut lexer = logos::Lexer::<SyntaxKind>::new(text);
+ // In kinds, a string block is matched as at least `|||`
+ lexer.bump(3);
+ let res = lex_str_block(&mut lexer);
+ debug_assert!(lexer.next().is_none(), "str_block is lexed");
+ match res {
+ Ok(_) => {}
+ Err(e) => {
+ kind = match e {
+ StringBlockError::UnexpectedEnd => ERROR_STRING_BLOCK_UNEXPECTED_END,
+ StringBlockError::MissingNewLine => ERROR_STRING_BLOCK_MISSING_NEW_LINE,
+ StringBlockError::MissingTermination => {
+ ERROR_STRING_BLOCK_MISSING_TERMINATION
+ }
+ StringBlockError::MissingIndent => ERROR_STRING_BLOCK_MISSING_INDENT,
+ }
+ }
+ }
+ }
+
Some(Self::Item {
kind,
text,
crates/jrsonnet-rowan-parser/src/lib.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/lib.rs
+++ b/crates/jrsonnet-rowan-parser/src/lib.rs
@@ -2,7 +2,6 @@
mod ast;
mod binary;
-mod classify;
mod event;
mod generated;
mod language;
crates/jrsonnet-rowan-parser/src/marker.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/marker.rs
+++ b/crates/jrsonnet-rowan-parser/src/marker.rs
@@ -44,10 +44,10 @@
!kind.is_enum(),
"{kind:?} is a enum kind, you should use variant kinds instead"
);
- // TODO: is_parser should return true if enum variant has #[regex]/#[token] over it
+ // TODO: is_lexer should return true if the enum variant has #[regex]/#[token] on it, or if it is explicitly defined as a lexer error
// debug_assert!(
- // !kind.is_parser(),
- // "{kind:?} should be only emitted by parser, not used directly"
+ // !kind.is_lexer(),
+ // "{kind:?} should be only emitted by lexer, not used directly"
// );
let event_at_pos = &mut p.events[self.start_event_idx];
assert_eq!(*event_at_pos, Event::Pending);
crates/jrsonnet-rowan-parser/src/parser.rsdiffbeforeafterboth--- a/crates/jrsonnet-rowan-parser/src/parser.rs
+++ b/crates/jrsonnet-rowan-parser/src/parser.rs
@@ -8,10 +8,10 @@
event::Event,
lex::Lexeme,
marker::{AsRange, CompletedMarker, Marker, Ranger},
- string_block::{lex_str_block, StringBlockError},
+ nodes::{Literal, Number, Text, Trivia},
token_set::SyntaxKindSet,
unary::UnaryOperator,
- SyntaxKind,
+ AstToken, SyntaxKind,
SyntaxKind::*,
SyntaxNode, T, TS,
};
@@ -36,6 +36,7 @@
}
pub struct Parser<'i> {
+ // TODO: remove all trivia before feeding to parser?
lexemes: &'i [Lexeme<'i>],
pub offset: usize,
pub events: Vec<Event>,
@@ -191,7 +192,7 @@
while self
.lexemes
.get(previous_token_idx)
- .map_or(false, |l| l.kind.is_trivia())
+ .map_or(false, |l| Trivia::can_cast(l.kind))
&& previous_token_idx != 0
{
previous_token_idx -= 1;
@@ -200,13 +201,13 @@
Some(self.lexemes[previous_token_idx])
}
pub fn start_of_token(&self, mut idx: usize) -> TextSize {
- while self.lexemes[idx].kind.is_trivia() {
+ while Trivia::can_cast(self.lexemes[idx].kind) {
idx += 1;
}
self.lexemes[idx].range.start()
}
pub fn end_of_token(&self, mut idx: usize) -> TextSize {
- while self.lexemes[idx].kind.is_trivia() {
+ while Trivia::can_cast(self.lexemes[idx].kind) {
idx -= 1;
}
self.lexemes[idx].range.end()
@@ -267,7 +268,11 @@
self.bump();
Some(m.complete(self, SyntaxKind::ERROR))
}
-
+ fn bump_assert(&mut self, kind: SyntaxKind) {
+ self.skip_trivia();
+ assert!(self.at(kind), "expected {:?}", kind);
+ self.bump_remap(self.current());
+ }
fn bump(&mut self) {
self.skip_trivia();
self.bump_remap(self.current());
@@ -314,7 +319,7 @@
while self
.lexemes
.get(offset)
- .map(|l| l.kind.is_trivia())
+ .map(|l| Trivia::can_cast(l.kind))
.unwrap_or(false)
{
offset += 1;
@@ -324,7 +329,7 @@
while self
.lexemes
.get(offset)
- .map(|l| l.kind.is_trivia())
+ .map(|l| Trivia::can_cast(l.kind))
.unwrap_or(false)
{
offset += 1;
@@ -335,14 +340,10 @@
self.nth(0)
}
fn skip_trivia(&mut self) {
- while self.peek_raw().is_trivia() {
+ while Trivia::can_cast(self.peek_raw()) {
self.offset += 1;
}
}
- fn current_lexeme(&mut self) -> Option<&Lexeme> {
- self.skip_trivia();
- self.lexemes.get(self.offset)
- }
fn peek_raw(&mut self) -> SyntaxKind {
self.lexemes
.get(self.offset)
@@ -516,8 +517,8 @@
} else if p.at(IDENT) {
name(p);
m.complete(p, FIELD_NAME_FIXED);
- } else if p.current().is_string() {
- string(p);
+ } else if Text::can_cast(p.current()) {
+ text(p);
m.complete(p, FIELD_NAME_FIXED);
} else {
p.error_with_recovery_set(TS![;]);
@@ -564,9 +565,8 @@
};
}
fn assertion(p: &mut Parser) {
- assert!(p.at(T![assert]));
let m = p.start();
- p.bump();
+ p.bump_assert(T![assert]);
expr(p).map(|c| c.wrap(p, LHS_EXPR));
if p.at(T![:]) {
p.bump();
@@ -575,10 +575,9 @@
m.complete(p, ASSERTION);
}
fn object(p: &mut Parser) -> CompletedMarker {
- assert!(p.at(T!['{']));
let m_t = p.start();
let m = p.start();
- p.bump();
+ p.bump_assert(T!['{']);
loop {
if p.at(T!['}']) {
@@ -619,9 +618,8 @@
m.complete(p, PARAM);
}
fn params_desc(p: &mut Parser) -> CompletedMarker {
- assert!(p.at(T!['(']));
let m = p.start();
- p.bump();
+ p.bump_assert(T!['(']);
loop {
if p.at(T![')']) {
@@ -640,8 +638,7 @@
}
fn args_desc(p: &mut Parser) {
let m = p.start();
- assert!(p.at(T!['(']));
- p.bump();
+ p.bump_assert(T!['(']);
let started_named = Cell::new(false);
@@ -674,10 +671,9 @@
}
fn array(p: &mut Parser) -> CompletedMarker {
- assert!(p.at(T!['[']));
// Start the list node
let m = p.start();
- p.bump(); // '['
+ p.bump_assert(T!['[']);
// This vec will have at most one element in case of correct input
let mut compspecs = Vec::with_capacity(1);
@@ -795,9 +791,8 @@
m.complete(p, NAME);
}
fn destruct_rest(p: &mut Parser) {
- assert!(p.at(T![...]));
- p.bump();
let m = p.start();
+ p.bump_assert(T![...]);
if p.at(IDENT) {
p.bump()
}
@@ -817,9 +812,8 @@
m.complete(p, DESTRUCT_OBJECT_FIELD);
}
fn obj_local(p: &mut Parser) {
- assert!(p.at(T![local]));
let m = p.start();
- p.bump();
+ p.bump_assert(T![local]);
bind(p);
m.complete(p, OBJ_LOCAL);
}
@@ -903,52 +897,29 @@
m.complete(p, BIND_DESTRUCT)
};
}
-fn string(p: &mut Parser) {
- assert!(p.current().is_string());
- if p.at(STRING_BLOCK) {
- // We use custom lexer, which skips enough bytes, but not returns error
- // Instead we should call lexer again to verify if there is something wrong with string block
- let mut lexer = logos::Lexer::<SyntaxKind>::new(dbg!(
- &p.current_lexeme().expect("parser is at string block").text
- ));
- // In kinds, string blocks is parsed at least as `|||`
- lexer.bump(3);
- let res = lex_str_block(&mut lexer);
- debug_assert!(lexer.next().is_none(), "str_block is lexed");
- match res {
- Ok(_) => {
- p.bump();
- }
- Err(e) => p.bump_remap(match e {
- StringBlockError::UnexpectedEnd => ERROR_STRING_BLOCK_UNEXPECTED_END,
- StringBlockError::MissingNewLine => ERROR_STRING_BLOCK_MISSING_NEW_LINE,
- StringBlockError::MissingTermination => ERROR_STRING_BLOCK_MISSING_TERMINATION,
- StringBlockError::MissingIndent => ERROR_STRING_BLOCK_MISSING_INDENT,
- }),
- }
- } else {
- p.bump();
- }
+fn text(p: &mut Parser) {
+ assert!(Text::can_cast(p.current()));
+ p.bump();
}
fn number(p: &mut Parser) {
- assert!(p.current().is_number());
+ assert!(Number::can_cast(p.current()));
p.bump();
}
fn literal(p: &mut Parser) {
- assert!(p.current().is_literal());
+ assert!(Literal::can_cast(p.current()));
p.bump();
}
fn lhs_basic(p: &mut Parser) -> Option<CompletedMarker> {
let _e = p.expected_syntax_name("value");
- Some(if p.current().is_literal() {
+ Some(if Literal::can_cast(p.current()) {
let m = p.start();
literal(p);
m.complete(p, EXPR_LITERAL)
- } else if p.current().is_string() {
+ } else if Text::can_cast(p.current()) {
let m = p.start();
- string(p);
+ text(p);
m.complete(p, EXPR_STRING)
- } else if p.current().is_number() {
+ } else if Number::can_cast(p.current()) {
let m = p.start();
number(p);
m.complete(p, EXPR_NUMBER)
@@ -1025,7 +996,7 @@
} else if p.at(T![import]) || p.at(T![importstr]) || p.at(T![importbin]) {
let m = p.start();
p.bump();
- string(p);
+ text(p);
m.complete(p, EXPR_IMPORT)
} else if p.at(T![-]) || p.at(T![!]) || p.at(T![~]) {
let op = match p.current() {
@@ -1044,8 +1015,7 @@
let m = p.start();
p.bump();
expr(p);
- assert!(p.at(T![')']));
- p.bump();
+ p.expect(T![')']);
m.complete(p, EXPR_PARENED)
} else {
p.error_with_recovery_set(TS![]);
xtask/src/sourcegen/kinds.rsdiffbeforeafterboth1#[derive(Debug)]2pub struct KindsSrc {3 /// Key - how this token appears in ungrammar4 defined_tokens: IndexMap<String, TokenKind>,5 defined_node_names: HashSet<String>,6 pub nodes: Vec<String>,7}89#[derive(Debug, Clone)]10pub enum TokenKind {11 /// May exist in token tree, but never in source code12 Meta { grammar_name: String, name: String },13 /// Specific parsing errors may be emitted as this type of kind14 Error {15 grammar_name: String,16 name: String,17 regex: Option<String>,18 priority: Option<u32>,19 },20 /// Keyword - literal match of token21 Keyword {22 /// How this keyword appears in grammar/code, should be same as Kinds key23 code: String,24 name: String,25 },26 /// Literal - something defined by user, i.e strings, identifiers, smth27 Literal {28 /// How this keyword appears in grammar, should be same as Kinds key29 grammar_name: String,30 name: String,31 /// Regex for Logos lexer32 regex: String,33 /// Path to custom lexer34 lexer: Option<String>,35 },36}3738impl TokenKind {39 pub fn grammar_name(&self) -> &str {40 match self {41 TokenKind::Keyword { code, .. } => code,42 TokenKind::Literal { grammar_name, .. } => grammar_name,43 TokenKind::Meta { grammar_name, .. } => grammar_name,44 TokenKind::Error { grammar_name, .. } => grammar_name,45 }46 }47 /// How this keyword should appear in kinds enum, screaming snake cased48 pub fn name(&self) -> &str {49 match self {50 TokenKind::Keyword { name, .. } => name,51 TokenKind::Literal { name, .. } => name,52 TokenKind::Meta { name, .. } => name,53 TokenKind::Error { name, .. } => name,54 }55 }56 pub fn expand_kind(&self) -> TokenStream {57 let name = format_ident!("{}", self.name());58 let attr = match self {59 TokenKind::Keyword { code, .. } => quote! {#[token(#code)]},60 TokenKind::Literal { regex, lexer, .. } => {61 let lexer = lexer62 .as_deref()63 .map(TokenStream::from_str)64 .map(|r| r.expect("path is correct"));65 quote! 
{#[regex(#regex, #lexer)]}66 }67 TokenKind::Error {68 regex, priority, ..69 } if regex.is_some() => {70 let priority = priority.map(|p| quote! {, priority = #p});71 quote! {#[regex(#regex #priority)]}72 }73 _ => quote! {},74 };75 quote! {76 #attr77 #name78 }79 }80 pub fn expand_t_macros(&self) -> Option<TokenStream> {81 match self {82 TokenKind::Keyword { code, name } => {83 let code = escape_token_macro(code);84 let name = format_ident!("{name}");85 Some(quote! {86 [#code] => {$crate::SyntaxKind::#name}87 })88 }89 // Meta items should not appear in T![_]90 _ => None,91 }92 }9394 /// How this token should be referenced in code95 /// Keywords are referenced with `T![_]` macro,96 /// and literals are referenced directly by name97 pub fn reference(&self) -> TokenStream {98 match self {99 TokenKind::Keyword { code, .. } => {100 let code = escape_token_macro(code);101 quote! {T![#code]}102 }103 _ => {104 let name = self.name();105 let ident = format_ident!("{name}");106 quote! {#ident}107 }108 }109 }110111 pub fn method_name(&self) -> Ident {112 match self {113 TokenKind::Keyword { name, .. } => {114 format_ident!("{}_token", name.to_lowercase())115 }116 TokenKind::Literal { name, .. } => {117 format_ident!("{}_lit", name.to_lowercase())118 }119 TokenKind::Meta { name, .. } => format_ident!("{}_meta", name.to_lowercase()),120 TokenKind::Error { name, .. } => format_ident!("{}_error", name.to_lowercase()),121 }122 }123}124125#[macro_export]126macro_rules! define_kinds {127 ($into:ident = lit($name:literal) => $regex:literal $(, $lexer:literal)? $(; $($rest:tt)*)?) => {{128 $into.define_token(TokenKind::Literal {129 grammar_name: format!("LIT_{}!", $name),130 name: $name.to_owned(),131 regex: $regex.to_owned(),132 lexer: None $(.or_else(|| Some($lexer.to_string())))?,133 });134 $(define_kinds!($into = $($rest)*))?135 }};136 ($into:ident = error($name:literal$(, priority = $priority:literal)?) $(=> $regex:literal)? $(; $($rest:tt)*)?) 
=> {{137 $into.define_token(TokenKind::Error {138 grammar_name: format!("ERROR_{}!", $name),139 name: format!("ERROR_{}", $name),140 regex: None$(.or(Some($regex.to_owned())))?,141 priority: None$(.or(Some($priority)))?,142 });143 $(define_kinds!($into = $($rest)*))?144 }};145 ($into:ident = $tok:literal => $name:literal $(; $($rest:tt)*)?) => {{146 $into.define_token(TokenKind::Keyword {147 code: format!("{}", $tok),148 name: $name.to_owned(),149 });150 $(define_kinds!($into = $($rest)*))?151 }};152 ($into:ident =) => {{}}153}154use std::{collections::HashSet, str::FromStr};155156pub use define_kinds;157use indexmap::IndexMap;158use proc_macro2::{Ident, TokenStream};159use quote::{format_ident, quote};160161use super::escape_token_macro;162163impl KindsSrc {164 pub fn new() -> Self {165 Self {166 defined_tokens: IndexMap::new(),167 defined_node_names: HashSet::new(),168 nodes: Vec::new(),169 }170 }171 pub fn define_token(&mut self, token: TokenKind) {172 assert!(173 self.defined_node_names.insert(token.name().to_owned()),174 "node name already defined: {}",175 token.name()176 );177 assert!(178 self.defined_tokens179 .insert(token.grammar_name().to_owned(), token.clone())180 .is_none(),181 "token already defined: {}",182 token.grammar_name()183 )184 }185 pub fn define_node(&mut self, node: &str) {186 assert!(187 self.defined_node_names.insert(node.to_owned()),188 "node name already defined: {}",189 node190 );191 self.nodes.push(node.to_string())192 }193 pub fn token(&self, tok: &str) -> Option<&TokenKind> {194 self.defined_tokens.get(tok)195 }196 pub fn is_token(&self, tok: &str) -> bool {197 self.defined_tokens.contains_key(tok)198 }199 pub fn tokens(&self) -> impl Iterator<Item = &TokenKind> {200 self.defined_tokens.iter().map(|(_, v)| v)201 }202}203204pub fn jsonnet_kinds() -> KindsSrc {205 let mut kinds = KindsSrc::new();206 define_kinds![kinds =207 "||" => "OR";208 "&&" => "AND";209 "|" => "BIT_OR";210 "^" => "BIT_XOR";211 "&" => "BIT_AND";212 "==" => "EQ";213 
"!=" => "NE";214 "<" => "LT";215 ">" => "GT";216 "<=" => "LE";217 ">=" => "GE";218 "<<" => "LHS";219 ">>" => "RHS";220 "+" => "PLUS";221 "-" => "MINUS";222 "*" => "MUL";223 "/" => "DIV";224 "%" => "MODULO";225 "!" => "NOT";226 "~" => "BIT_NOT";227 "[" => "L_BRACK";228 "]" => "R_BRACK";229 "(" => "L_PAREN";230 ")" => "R_PAREN";231 "{" => "L_BRACE";232 "}" => "R_BRACE";233 ":" => "COLON";234 "::" => "COLONCOLON";235 ":::" => "COLONCOLONCOLON";236 ";" => "SEMI";237 "." => "DOT";238 "..." => "DOTDOTDOT";239 "," => "COMMA";240 "$" => "DOLLAR";241 "=" => "ASSIGN";242 "?" => "QUESTION_MARK";243 "$intrinsicThisFile" => "INTRINSIC_THIS_FILE";244 "$intrinsicId" => "INTRINSIC_ID";245 "$intrinsic" => "INTRINSIC";246 // Literals247 lit("FLOAT") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?(?:[eE][+-]?[0-9]+)?";248 error("FLOAT_JUNK_AFTER_POINT") => r"(?:0|[1-9][0-9]*)\.[^0-9]";249 error("FLOAT_JUNK_AFTER_EXPONENT") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?[eE][^+\-0-9]";250 error("FLOAT_JUNK_AFTER_EXPONENT_SIGN") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?[eE][+-][^0-9]";251 lit("STRING_DOUBLE") => "\"(?s:[^\"\\\\]|\\\\.)*\"";252 error("STRING_DOUBLE_UNTERMINATED") => "\"(?s:[^\"\\\\]|\\\\.)*";253 lit("STRING_SINGLE") => "'(?s:[^'\\\\]|\\\\.)*'";254 error("STRING_SINGLE_UNTERMINATED") => "'(?s:[^'\\\\]|\\\\.)*";255 lit("STRING_DOUBLE_VERBATIM") => "@\"(?:[^\"]|\"\")*\"";256 error("STRING_DOUBLE_VERBATIM_UNTERMINATED") => "@\"(?:[^\"]|\"\")*";257 lit("STRING_SINGLE_VERBATIM") => "@'(?:[^']|'')*'";258 error("STRING_SINGLE_VERBATIM_UNTERMINATED") => "@'(?:[^']|'')*";259 error("STRING_VERBATIM_MISSING_QUOTES") => "@[^\"'\\s]\\S+";260 lit("STRING_BLOCK") => r"\|\|\|", "crate::string_block::lex_str_block_test";261 error("STRING_BLOCK_UNEXPECTED_END");262 error("STRING_BLOCK_MISSING_NEW_LINE");263 error("STRING_BLOCK_MISSING_TERMINATION");264 error("STRING_BLOCK_MISSING_INDENT");265 lit("IDENT") => r"[_a-zA-Z][_a-zA-Z0-9]*";266 lit("WHITESPACE") => r"[ \t\n\r]+";267 lit("SINGLE_LINE_SLASH_COMMENT") => 
r"//[^\r\n]*(\r\n|\n)?";268 lit("SINGLE_LINE_HASH_COMMENT") => r"#[^\r\n]*(\r\n|\n)?";269 lit("MULTI_LINE_COMMENT") => r"/\*([^*]|\*[^/])*\*/";270 error("COMMENT_TOO_SHORT") => r"/\*/";271 error("COMMENT_UNTERMINATED") => r"/\*([^*]|\*[^/])+";272 ];273 kinds274}1#[derive(Debug)]2pub struct KindsSrc {3 /// Key - how this token appears in ungrammar4 defined_tokens: IndexMap<String, TokenKind>,5 defined_node_names: HashSet<String>,6 pub nodes: Vec<String>,7}89#[derive(Debug, Clone)]10pub enum TokenKind {11 /// May exist in token tree, but never in source code12 Meta { grammar_name: String, name: String },13 /// Specific parsing/lexing errors may be emitted as this type of kind14 Error {15 grammar_name: String,16 name: String,17 /// Is this error returned by lexer directly, or from lex.rs18 is_lexer_error: bool,19 regex: Option<String>,20 priority: Option<u32>,21 },22 /// Keyword - literal match of token23 Keyword {24 /// How this keyword appears in grammar/code, should be same as Kinds key25 code: String,26 name: String,27 },28 /// Literal - something defined by user, i.e strings, identifiers, smth29 Literal {30 /// How this keyword appears in grammar, should be same as Kinds key31 grammar_name: String,32 name: String,33 /// Regex for Logos lexer34 regex: String,35 /// Path to custom lexer36 lexer: Option<String>,37 },38}3940impl TokenKind {41 pub fn grammar_name(&self) -> &str {42 match self {43 TokenKind::Keyword { code, .. } => code,44 TokenKind::Literal { grammar_name, .. } => grammar_name,45 TokenKind::Meta { grammar_name, .. } => grammar_name,46 TokenKind::Error { grammar_name, .. } => grammar_name,47 }48 }49 /// How this keyword should appear in kinds enum, screaming snake cased50 pub fn name(&self) -> &str {51 match self {52 TokenKind::Keyword { name, .. } => name,53 TokenKind::Literal { name, .. } => name,54 TokenKind::Meta { name, .. } => name,55 TokenKind::Error { name, .. 
} => name,56 }57 }58 pub fn expand_kind(&self) -> TokenStream {59 let name = format_ident!("{}", self.name());60 let attr = match self {61 TokenKind::Keyword { code, .. } => quote! {#[token(#code)]},62 TokenKind::Literal { regex, lexer, .. } => {63 let lexer = lexer64 .as_deref()65 .map(TokenStream::from_str)66 .map(|r| r.expect("path is correct"));67 quote! {#[regex(#regex, #lexer)]}68 }69 TokenKind::Error {70 regex, priority, ..71 } if regex.is_some() => {72 let priority = priority.map(|p| quote! {, priority = #p});73 quote! {#[regex(#regex #priority)]}74 }75 _ => quote! {},76 };77 quote! {78 #attr79 #name80 }81 }82 pub fn expand_t_macros(&self) -> Option<TokenStream> {83 match self {84 TokenKind::Keyword { code, name } => {85 let code = escape_token_macro(code);86 let name = format_ident!("{name}");87 Some(quote! {88 [#code] => {$crate::SyntaxKind::#name}89 })90 }91 // Meta items should not appear in T![_]92 _ => None,93 }94 }9596 /// How this token should be referenced in code97 /// Keywords are referenced with `T![_]` macro,98 /// and literals are referenced directly by name99 pub fn reference(&self) -> TokenStream {100 match self {101 TokenKind::Keyword { code, .. } => {102 let code = escape_token_macro(code);103 quote! {T![#code]}104 }105 _ => {106 let name = self.name();107 let ident = format_ident!("{name}");108 quote! {#ident}109 }110 }111 }112113 pub fn method_name(&self) -> Ident {114 match self {115 TokenKind::Keyword { name, .. } => {116 format_ident!("{}_token", name.to_lowercase())117 }118 TokenKind::Literal { name, .. } => {119 format_ident!("{}_lit", name.to_lowercase())120 }121 TokenKind::Meta { name, .. } => format_ident!("{}_meta", name.to_lowercase()),122 TokenKind::Error { name, .. } => format_ident!("{}_error", name.to_lowercase()),123 }124 }125}126127#[macro_export]128macro_rules! define_kinds {129 ($into:ident = lit($name:literal) => $regex:literal $(, $lexer:literal)? $(; $($rest:tt)*)?) 
=> {{130 $into.define_token(TokenKind::Literal {131 grammar_name: format!("LIT_{}!", $name),132 name: $name.to_owned(),133 regex: $regex.to_owned(),134 lexer: None $(.or_else(|| Some($lexer.to_string())))?,135 });136 $(define_kinds!($into = $($rest)*))?137 }};138 ($into:ident = error($name:literal$(, priority = $priority:literal)? $(, lexer = $lexer:literal)?) $(=> $regex:literal)? $(; $($rest:tt)*)?) => {{139 {140 let regex = None$(.or(Some($regex.to_owned())))?;141 let priority = None$(.or(Some($priority)))?;142 $into.define_token(TokenKind::Error {143 grammar_name: format!("ERROR_{}!", $name),144 name: format!("ERROR_{}", $name),145 is_lexer_error: false $(|| $lexer)? || regex.is_some() || priority.is_some(),146 regex,147 priority,148 });149 }150 $(define_kinds!($into = $($rest)*))?151 }};152 ($into:ident = $tok:literal => $name:literal $(; $($rest:tt)*)?) => {{153 $into.define_token(TokenKind::Keyword {154 code: format!("{}", $tok),155 name: $name.to_owned(),156 });157 $(define_kinds!($into = $($rest)*))?158 }};159 ($into:ident =) => {{}}160}161use std::{collections::HashSet, str::FromStr};162163pub use define_kinds;164use indexmap::IndexMap;165use proc_macro2::{Ident, TokenStream};166use quote::{format_ident, quote};167168use super::escape_token_macro;169170impl KindsSrc {171 pub fn new() -> Self {172 Self {173 defined_tokens: IndexMap::new(),174 defined_node_names: HashSet::new(),175 nodes: Vec::new(),176 }177 }178 pub fn define_token(&mut self, token: TokenKind) {179 assert!(180 self.defined_node_names.insert(token.name().to_owned()),181 "node name already defined: {}",182 token.name()183 );184 assert!(185 self.defined_tokens186 .insert(token.grammar_name().to_owned(), token.clone())187 .is_none(),188 "token already defined: {}",189 token.grammar_name()190 )191 }192 pub fn define_node(&mut self, node: &str) {193 assert!(194 self.defined_node_names.insert(node.to_owned()),195 "node name already defined: {}",196 node197 );198 
self.nodes.push(node.to_string())199 }200 pub fn token(&self, tok: &str) -> Option<&TokenKind> {201 self.defined_tokens.get(tok)202 }203 pub fn is_token(&self, tok: &str) -> bool {204 self.defined_tokens.contains_key(tok)205 }206 pub fn tokens(&self) -> impl Iterator<Item = &TokenKind> {207 self.defined_tokens.iter().map(|(_, v)| v)208 }209}210211pub fn jsonnet_kinds() -> KindsSrc {212 let mut kinds = KindsSrc::new();213 define_kinds![kinds =214 "||" => "OR";215 "&&" => "AND";216 "|" => "BIT_OR";217 "^" => "BIT_XOR";218 "&" => "BIT_AND";219 "==" => "EQ";220 "!=" => "NE";221 "<" => "LT";222 ">" => "GT";223 "<=" => "LE";224 ">=" => "GE";225 "<<" => "LHS";226 ">>" => "RHS";227 "+" => "PLUS";228 "-" => "MINUS";229 "*" => "MUL";230 "/" => "DIV";231 "%" => "MODULO";232 "!" => "NOT";233 "~" => "BIT_NOT";234 "[" => "L_BRACK";235 "]" => "R_BRACK";236 "(" => "L_PAREN";237 ")" => "R_PAREN";238 "{" => "L_BRACE";239 "}" => "R_BRACE";240 ":" => "COLON";241 "::" => "COLONCOLON";242 ":::" => "COLONCOLONCOLON";243 ";" => "SEMI";244 "." => "DOT";245 "..." => "DOTDOTDOT";246 "," => "COMMA";247 "$" => "DOLLAR";248 "=" => "ASSIGN";249 "?" 
=> "QUESTION_MARK";250 "$intrinsicThisFile" => "INTRINSIC_THIS_FILE";251 "$intrinsicId" => "INTRINSIC_ID";252 "$intrinsic" => "INTRINSIC";253 // Literals254 lit("FLOAT") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?(?:[eE][+-]?[0-9]+)?";255 error("FLOAT_JUNK_AFTER_POINT") => r"(?:0|[1-9][0-9]*)\.[^0-9]";256 error("FLOAT_JUNK_AFTER_EXPONENT") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?[eE][^+\-0-9]";257 error("FLOAT_JUNK_AFTER_EXPONENT_SIGN") => r"(?:0|[1-9][0-9]*)(?:\.[0-9]+)?[eE][+-][^0-9]";258 lit("STRING_DOUBLE") => "\"(?s:[^\"\\\\]|\\\\.)*\"";259 error("STRING_DOUBLE_UNTERMINATED") => "\"(?s:[^\"\\\\]|\\\\.)*";260 lit("STRING_SINGLE") => "'(?s:[^'\\\\]|\\\\.)*'";261 error("STRING_SINGLE_UNTERMINATED") => "'(?s:[^'\\\\]|\\\\.)*";262 lit("STRING_DOUBLE_VERBATIM") => "@\"(?:[^\"]|\"\")*\"";263 error("STRING_DOUBLE_VERBATIM_UNTERMINATED") => "@\"(?:[^\"]|\"\")*";264 lit("STRING_SINGLE_VERBATIM") => "@'(?:[^']|'')*'";265 error("STRING_SINGLE_VERBATIM_UNTERMINATED") => "@'(?:[^']|'')*";266 error("STRING_VERBATIM_MISSING_QUOTES") => "@[^\"'\\s]\\S+";267 lit("STRING_BLOCK") => r"\|\|\|", "crate::string_block::lex_str_block_test";268 error("STRING_BLOCK_UNEXPECTED_END", lexer = true);269 error("STRING_BLOCK_MISSING_NEW_LINE", lexer = true);270 error("STRING_BLOCK_MISSING_TERMINATION", lexer = true);271 error("STRING_BLOCK_MISSING_INDENT", lexer = true);272 lit("IDENT") => r"[_a-zA-Z][_a-zA-Z0-9]*";273 lit("WHITESPACE") => r"[ \t\n\r]+";274 lit("SINGLE_LINE_SLASH_COMMENT") => r"//[^\r\n]*(\r\n|\n)?";275 lit("SINGLE_LINE_HASH_COMMENT") => r"#[^\r\n]*(\r\n|\n)?";276 lit("MULTI_LINE_COMMENT") => r"/\*([^*]|\*[^/])*\*/";277 error("COMMENT_TOO_SHORT") => r"/\*/";278 error("COMMENT_UNTERMINATED") => r"/\*([^*]|\*[^/])+";279 ];280 kinds281}xtask/src/sourcegen/mod.rsdiffbeforeafterboth--- a/xtask/src/sourcegen/mod.rs
+++ b/xtask/src/sourcegen/mod.rs
@@ -48,20 +48,28 @@
if let Some((special, name)) = classify_special(token) {
match special {
SpecialName::Literal => panic!("literal is not defined: {name}"),
- SpecialName::Meta => kinds.define_token(TokenKind::Meta {
- grammar_name: token.to_owned(),
- name: format!("META_{}", name),
- }),
- SpecialName::Error => kinds.define_token(TokenKind::Error {
- grammar_name: token.to_owned(),
- name: format!("ERROR_{}", name),
- regex: None,
- priority: None,
- }),
+ SpecialName::Meta => {
+ eprintln!("implicit meta: {}", name);
+ kinds.define_token(TokenKind::Meta {
+ grammar_name: token.to_owned(),
+ name: format!("META_{}", name),
+ })
+ }
+ SpecialName::Error => {
+ eprintln!("implicit error: {}", name);
+ kinds.define_token(TokenKind::Error {
+ grammar_name: token.to_owned(),
+ name: format!("ERROR_{}", name),
+ regex: None,
+ priority: None,
+ is_lexer_error: true,
+ })
+ }
};
continue;
};
let name = to_upper_snake_case(token);
+ eprintln!("implicit kw: {}", token);
kinds.define_token(TokenKind::Keyword {
code: token.to_owned(),
name: format!("{name}_KW"),
xtask/src/sourcegen/util.rsdiffbeforeafterboth--- a/xtask/src/sourcegen/util.rs
+++ b/xtask/src/sourcegen/util.rs
@@ -13,10 +13,7 @@
}
}
- eprintln!(" {} was not up-to-date, updating\n", file.display());
- if std::env::var("CI").is_ok() {
- eprintln!("NOTE: run `cargo xtask` locally and commit the updated files\n");
- }
+ eprintln!("{} was not up-to-date, updating", file.display());
if let Some(parent) = file.parent() {
let _ = fs::create_dir_all(parent);
}