#[cfg(feature = "bincode")]
use bincode::{Decode, Encode};
use lazy_static::lazy_static;
use num_traits::PrimInt;
use regex::Regex;
#[cfg(feature = "serde")]
use serde::{Deserialize, Serialize};
use std::{
collections::{hash_map::Entry, HashMap},
error::Error,
fmt,
str::FromStr,
};
pub type YaccGrammarResult<T> = Result<T, Vec<YaccGrammarError>>;
use crate::{
header::{GrmtoolsSectionParser, HeaderErrorKind, Namespaced, Setting, Value},
Span, Spanned,
};
use super::{
ast::{GrammarAST, Symbol},
AssocKind, Precedence, YaccKind, YaccKindResolver, YaccOriginalActionKind,
};
#[derive(Debug, PartialEq, Eq, Clone)]
#[non_exhaustive]
pub enum YaccGrammarErrorKind {
IllegalInteger,
IllegalName,
IllegalString,
IncompleteRule,
IncompleteComment,
IncompleteAction,
MissingColon,
MissingRightArrow,
MismatchedBrace,
NonEmptyProduction,
PrematureEnd,
ProductionNotTerminated,
ProgramsNotSupported,
UnknownDeclaration,
PrecNotFollowedByToken,
DuplicatePrecedence,
DuplicateAvoidInsertDeclaration,
DuplicateImplicitTokensDeclaration,
DuplicateExpectDeclaration,
DuplicateExpectRRDeclaration,
DuplicateStartDeclaration,
DuplicateActiontypeDeclaration,
DuplicateEPP,
ReachedEOL,
InvalidString,
NoStartRule,
UnknownSymbol,
InvalidStartRule(String),
UnknownRuleRef(String),
UnknownToken(String),
NoPrecForToken(String),
UnknownEPP(String),
ExpectedInput(char),
InvalidYaccKind,
InvalidYaccKindNamespace,
InvalidActionKind,
InvalidActionKindNamespace,
InvalidGrmtoolsSectionEntry,
DuplicateGrmtoolsSectionEntry,
MissingGrmtoolsSection,
}
#[derive(Debug, PartialEq, Eq, Clone)]
pub struct YaccGrammarError {
pub(crate) kind: YaccGrammarErrorKind,
pub(crate) spans: Vec<Span>,
}
impl Error for YaccGrammarError {}
impl fmt::Display for YaccGrammarError {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
write!(f, "{}", self.kind)
}
}
impl fmt::Display for YaccGrammarErrorKind {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
let s = match self {
YaccGrammarErrorKind::ExpectedInput(c) => &format!("Expected input '{c}'"),
YaccGrammarErrorKind::IllegalInteger => "Illegal integer",
YaccGrammarErrorKind::IllegalName => "Illegal name",
YaccGrammarErrorKind::IllegalString => "Illegal string",
YaccGrammarErrorKind::IncompleteRule => "Incomplete rule",
YaccGrammarErrorKind::IncompleteComment => "Incomplete comment",
YaccGrammarErrorKind::IncompleteAction => "Incomplete action",
YaccGrammarErrorKind::MissingColon => "Missing ':'",
YaccGrammarErrorKind::MissingRightArrow => "Missing '->'",
YaccGrammarErrorKind::MismatchedBrace => "Mismatched brace",
YaccGrammarErrorKind::NonEmptyProduction => "%empty used in non-empty production",
YaccGrammarErrorKind::PrematureEnd => "File ends prematurely",
YaccGrammarErrorKind::ProductionNotTerminated => "Production not terminated correctly",
YaccGrammarErrorKind::ProgramsNotSupported => "Programs not currently supported",
YaccGrammarErrorKind::UnknownDeclaration => "Unknown declaration",
YaccGrammarErrorKind::DuplicatePrecedence => "Token has multiple precedences specified",
YaccGrammarErrorKind::PrecNotFollowedByToken => "%prec not followed by token name",
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration => {
"Duplicated %avoid_insert declaration"
}
YaccGrammarErrorKind::DuplicateExpectDeclaration => "Duplicated %expect declaration",
YaccGrammarErrorKind::DuplicateExpectRRDeclaration => {
"Duplicate %expect-rr declaration"
}
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration => {
"Duplicated %implicit_tokens declaration"
}
YaccGrammarErrorKind::DuplicateStartDeclaration => "Duplicated %start declaration",
YaccGrammarErrorKind::DuplicateActiontypeDeclaration => {
"Duplicate %actiontype declaration"
}
YaccGrammarErrorKind::DuplicateEPP => "Duplicate %epp declaration for this token",
YaccGrammarErrorKind::ReachedEOL => {
"Reached end of line without finding expected content"
}
YaccGrammarErrorKind::InvalidString => "Invalid string",
YaccGrammarErrorKind::NoStartRule => return write!(f, "No start rule specified"),
YaccGrammarErrorKind::UnknownSymbol => "Unknown symbol, expected a rule or token",
YaccGrammarErrorKind::InvalidStartRule(name) => {
return write!(f, "Start rule '{}' does not appear in grammar", name)
}
YaccGrammarErrorKind::UnknownRuleRef(name) => {
return write!(f, "Unknown reference to rule '{}'", name)
}
YaccGrammarErrorKind::UnknownToken(name) => {
return write!(f, "Unknown token '{}'", name)
}
YaccGrammarErrorKind::NoPrecForToken(name) => {
return write!(
f,
"Token '{}' used in %prec has no precedence attached",
name
)
}
YaccGrammarErrorKind::UnknownEPP(name) => {
return write!(
f,
"Token '{}' in %epp declaration is not referenced in the grammar",
name
)
}
YaccGrammarErrorKind::MissingGrmtoolsSection => "Missing '%grmtools' section",
YaccGrammarErrorKind::DuplicateGrmtoolsSectionEntry => {
"Duplicate entry in %grmtools section"
}
YaccGrammarErrorKind::InvalidGrmtoolsSectionEntry => {
"Invalid entry in %grmtools section"
}
YaccGrammarErrorKind::InvalidYaccKind => "Invalid yacc kind",
YaccGrammarErrorKind::InvalidYaccKindNamespace => "Invalid yacc kind namespace",
YaccGrammarErrorKind::InvalidActionKind => "Invalid action kind",
YaccGrammarErrorKind::InvalidActionKindNamespace => "Invalid action kind namespace",
};
write!(f, "{}", s)
}
}
#[derive(Debug, PartialEq, Eq, Clone)]
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
#[cfg_attr(feature = "bincode", derive(Encode, Decode))]
#[non_exhaustive]
pub enum YaccGrammarWarningKind {
UnusedRule,
UnusedToken,
}
#[derive(Debug, PartialEq, Eq, Clone)]
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
#[cfg_attr(feature = "bincode", derive(Encode, Decode))]
pub struct YaccGrammarWarning {
pub(crate) kind: YaccGrammarWarningKind,
pub(crate) spans: Vec<Span>,
}
impl fmt::Display for YaccGrammarWarning {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
write!(f, "{}", self.kind)
}
}
impl fmt::Display for YaccGrammarWarningKind {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
let s = match self {
YaccGrammarWarningKind::UnusedRule => "Unused rule",
YaccGrammarWarningKind::UnusedToken => "Unused token",
};
write!(f, "{}", s)
}
}
impl Spanned for YaccGrammarWarning {
fn spans(&self) -> &[Span] {
self.spans.as_slice()
}
fn spanskind(&self) -> SpansKind {
match self.kind {
YaccGrammarWarningKind::UnusedRule | YaccGrammarWarningKind::UnusedToken => {
SpansKind::Error
}
}
}
}
#[non_exhaustive]
pub enum SpansKind {
DuplicationError,
Error,
}
impl Spanned for YaccGrammarError {
fn spans(&self) -> &[Span] {
self.spans.as_slice()
}
fn spanskind(&self) -> SpansKind {
match self.kind {
YaccGrammarErrorKind::IllegalInteger
| YaccGrammarErrorKind::IllegalName
| YaccGrammarErrorKind::IllegalString
| YaccGrammarErrorKind::IncompleteRule
| YaccGrammarErrorKind::IncompleteComment
| YaccGrammarErrorKind::IncompleteAction
| YaccGrammarErrorKind::MissingColon
| YaccGrammarErrorKind::MissingRightArrow
| YaccGrammarErrorKind::MismatchedBrace
| YaccGrammarErrorKind::NonEmptyProduction
| YaccGrammarErrorKind::PrematureEnd
| YaccGrammarErrorKind::ProductionNotTerminated
| YaccGrammarErrorKind::PrecNotFollowedByToken
| YaccGrammarErrorKind::ProgramsNotSupported
| YaccGrammarErrorKind::UnknownDeclaration
| YaccGrammarErrorKind::ReachedEOL
| YaccGrammarErrorKind::InvalidString
| YaccGrammarErrorKind::NoStartRule
| YaccGrammarErrorKind::UnknownSymbol
| YaccGrammarErrorKind::InvalidStartRule(_)
| YaccGrammarErrorKind::UnknownRuleRef(_)
| YaccGrammarErrorKind::UnknownToken(_)
| YaccGrammarErrorKind::NoPrecForToken(_)
| YaccGrammarErrorKind::MissingGrmtoolsSection
| YaccGrammarErrorKind::InvalidGrmtoolsSectionEntry
| YaccGrammarErrorKind::InvalidYaccKind
| YaccGrammarErrorKind::InvalidYaccKindNamespace
| YaccGrammarErrorKind::InvalidActionKind
| YaccGrammarErrorKind::InvalidActionKindNamespace
| YaccGrammarErrorKind::ExpectedInput(_)
| YaccGrammarErrorKind::UnknownEPP(_) => SpansKind::Error,
YaccGrammarErrorKind::DuplicatePrecedence
| YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration
| YaccGrammarErrorKind::DuplicateExpectDeclaration
| YaccGrammarErrorKind::DuplicateExpectRRDeclaration
| YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration
| YaccGrammarErrorKind::DuplicateStartDeclaration
| YaccGrammarErrorKind::DuplicateActiontypeDeclaration
| YaccGrammarErrorKind::DuplicateGrmtoolsSectionEntry
| YaccGrammarErrorKind::DuplicateEPP => SpansKind::DuplicationError,
}
}
}
pub(crate) struct YaccParser {
yacc_kind_resolver: YaccKindResolver,
yacc_kind: Option<YaccKind>,
src: String,
num_newlines: usize,
ast: GrammarAST,
global_actiontype: Option<(String, Span)>,
}
lazy_static! {
static ref RE_NAME: Regex = Regex::new(r"^[a-zA-Z_.][a-zA-Z0-9_.]*").unwrap();
static ref RE_TOKEN: Regex =
Regex::new("^(?:(\".+?\")|('.+?')|([a-zA-Z_][a-zA-Z_0-9]*))").unwrap();
}
fn add_duplicate_occurrence(
errs: &mut Vec<YaccGrammarError>,
kind: YaccGrammarErrorKind,
orig_span: Span,
dup_span: Span,
) {
if !errs.iter_mut().any(|e| {
if e.kind == kind && e.spans[0] == orig_span {
e.spans.push(dup_span);
true
} else {
false
}
}) {
errs.push(YaccGrammarError {
kind,
spans: vec![orig_span, dup_span],
});
}
}
impl YaccParser {
pub(crate) fn new(yacc_kind_resolver: YaccKindResolver, src: String) -> YaccParser {
YaccParser {
yacc_kind_resolver,
yacc_kind: None,
src,
num_newlines: 0,
ast: GrammarAST::new(),
global_actiontype: None,
}
}
pub(crate) fn parse(&mut self) -> YaccGrammarResult<usize> {
let mut errs: Vec<YaccGrammarError> = Vec::new();
let section_required = matches!(self.yacc_kind_resolver, YaccKindResolver::NoDefault);
let header_parser = GrmtoolsSectionParser::new(&self.src, section_required);
let result = match header_parser.parse() {
Ok((header, i)) => self.update_yacckind(header, i),
Err(es) => {
errs.extend(es.iter().map(|e| YaccGrammarError {
kind: match e.kind {
HeaderErrorKind::MissingGrmtoolsSection => {
YaccGrammarErrorKind::MissingGrmtoolsSection
}
HeaderErrorKind::IllegalName => {
YaccGrammarErrorKind::InvalidGrmtoolsSectionEntry
}
HeaderErrorKind::ExpectedToken(c) => YaccGrammarErrorKind::ExpectedInput(c),
HeaderErrorKind::DuplicateEntry => {
YaccGrammarErrorKind::DuplicateGrmtoolsSectionEntry
}
},
spans: e.spans.clone(),
}));
return Err(errs);
}
};
if result.is_ok() && (self.yacc_kind.is_none() || self.yacc_kind_resolver.forced()) {
match self.yacc_kind_resolver {
YaccKindResolver::Default(kind) | YaccKindResolver::Force(kind) => {
self.yacc_kind = Some(kind);
}
YaccKindResolver::NoDefault => {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKind,
spans: vec![Span::new(0, 0)],
});
return Err(errs);
}
}
}
let mut result = self.parse_declarations(
match result {
Ok(i) => i,
Err(es) => {
errs.extend(es);
return Err(errs);
}
},
&mut errs,
);
result = self.parse_rules(match result {
Ok(i) => i,
Err(e) => {
errs.push(e);
return Err(errs);
}
});
result = self.parse_programs(
match result {
Ok(i) => i,
Err(e) => {
errs.push(e);
return Err(errs);
}
},
&mut errs,
);
match result {
Ok(i) if errs.is_empty() => Ok(i),
Err(e) => {
errs.push(e);
Err(errs)
}
_ => Err(errs),
}
}
fn update_yacckind(
&mut self,
header: HashMap<String, (Span, Value)>,
i: usize,
) -> Result<usize, Vec<YaccGrammarError>> {
if let Some((key_span, yk_setting)) = header.get("yacckind") {
match yk_setting {
Value::Flag(_) => {
return Err(vec![YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKind,
spans: vec![*key_span],
}])
}
Value::Setting(Setting::Num(_, span)) => {
return Err(vec![YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKind,
spans: vec![*span],
}])
}
Value::Setting(Setting::Unitary(Namespaced {
namespace,
member: (yk_value, yk_value_span),
})) => {
let mut errs = vec![];
if let Some((ns, ns_span)) = namespace {
if ns != "yacckind" {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKindNamespace,
spans: vec![*ns_span],
});
}
}
let yacckinds = [
("grmtools".to_string(), YaccKind::Grmtools),
("eco".to_string(), YaccKind::Eco),
];
let yk_found = yacckinds
.iter()
.find_map(|(yk_str, yk)| (yk_str == yk_value).then_some(yk));
if yk_found.is_some() {
if errs.is_empty() {
self.yacc_kind = yk_found.cloned();
return Ok(i);
} else {
return Err(errs);
}
} else {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKind,
spans: vec![*yk_value_span],
});
return Err(errs);
}
}
Value::Setting(Setting::Constructor {
ctor:
Namespaced {
namespace: yk_namespace,
member: (yk_str, yk_span),
},
arg:
Namespaced {
namespace: ak_namespace,
member: (ak_str, ak_span),
},
}) => {
let mut errs = vec![];
if let Some((yk_ns, yk_ns_span)) = yk_namespace {
if yk_ns != "yacckind" {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKindNamespace,
spans: vec![*yk_ns_span],
});
}
}
if yk_str != "original" {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidYaccKind,
spans: vec![*yk_span],
});
}
if let Some((ak_ns, ak_ns_span)) = ak_namespace {
if ak_ns != "yaccoriginalactionkind" {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidActionKindNamespace,
spans: vec![*ak_ns_span],
});
}
}
let actionkinds = [
("noaction", YaccOriginalActionKind::NoAction),
("useraction", YaccOriginalActionKind::UserAction),
("genericparsetree", YaccOriginalActionKind::GenericParseTree),
];
let yk_found = actionkinds.iter().find_map(|(actionkind_str, actionkind)| {
(ak_str == actionkind_str).then_some(YaccKind::Original(*actionkind))
});
if yk_found.is_some() {
if errs.is_empty() {
self.yacc_kind = yk_found;
return Ok(i);
} else {
return Err(errs);
}
} else {
errs.push(YaccGrammarError {
kind: YaccGrammarErrorKind::InvalidActionKind,
spans: vec![*ak_span],
});
return Err(errs);
}
}
}
}
Ok(i)
}
pub(crate) fn build(self) -> (Option<YaccKind>, GrammarAST) {
(self.yacc_kind, self.ast)
}
fn parse_declarations(
&mut self,
mut i: usize,
errs: &mut Vec<YaccGrammarError>,
) -> Result<usize, YaccGrammarError> {
i = self.parse_ws(i, true)?;
let mut prec_level = 0;
while i < self.src.len() {
if self.lookahead_is("%%", i).is_some() {
return Ok(i);
}
if let Some(j) = self.lookahead_is("%token", i) {
i = self.parse_ws(j, false)?;
while i < self.src.len() && self.lookahead_is("%", i).is_none() {
let (j, n, span) = self.parse_token(i)?;
if self.ast.tokens.insert(n) {
self.ast.spans.push(span);
}
i = self.parse_ws(j, true)?;
}
continue;
}
if let Some(YaccKind::Original(_)) = self.yacc_kind {
if let Some(j) = self.lookahead_is("%actiontype", i) {
i = self.parse_ws(j, false)?;
let (j, n) = self.parse_to_eol(i)?;
let span = Span::new(i, j);
if let Some((_, orig_span)) = self.global_actiontype {
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateActiontypeDeclaration,
orig_span,
span,
);
} else {
self.global_actiontype = Some((n, span));
}
i = self.parse_ws(j, true)?;
continue;
}
}
if let Some(j) = self.lookahead_is("%start", i) {
i = self.parse_ws(j, false)?;
let (j, n) = self.parse_name(i)?;
let span = Span::new(i, j);
if let Some((_, orig_span)) = self.ast.start {
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateStartDeclaration,
orig_span,
span,
);
} else {
self.ast.start = Some((n, span));
}
i = self.parse_ws(j, true)?;
continue;
}
if let Some(j) = self.lookahead_is("%epp", i) {
i = self.parse_ws(j, false)?;
let (j, n, _) = self.parse_token(i)?;
let span = Span::new(i, j);
i = self.parse_ws(j, false)?;
let (j, v) = self.parse_string(i)?;
let vspan = Span::new(i, j);
match self.ast.epp.entry(n) {
Entry::Occupied(orig) => {
let (orig_span, _) = orig.get();
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateEPP,
*orig_span,
span,
)
}
Entry::Vacant(epp) => {
epp.insert((span, (v, vspan)));
}
}
i = self.parse_ws(j, true)?;
continue;
}
if let Some(j) = self.lookahead_is("%expect-rr", i) {
i = self.parse_ws(j, false)?;
let (j, n) = self.parse_int(i)?;
let span = Span::new(i, j);
if let Some((_, orig_span)) = self.ast.expectrr {
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateExpectRRDeclaration,
orig_span,
span,
);
} else {
self.ast.expectrr = Some((n, span));
}
i = self.parse_ws(j, true)?;
continue;
}
if let Some(j) = self.lookahead_is("%expect-unused", i) {
i = self.parse_ws(j, false)?;
while i < self.src.len() && self.lookahead_is("%", i).is_none() {
let j = match self.parse_name(i) {
Ok((j, n)) => {
self.ast
.expect_unused
.push(Symbol::Rule(n, Span::new(i, j)));
j
}
Err(_) => match self.parse_token(i) {
Ok((j, n, span)) => {
self.ast.expect_unused.push(Symbol::Token(n, span));
j
}
Err(_) => {
return Err(self.mk_error(YaccGrammarErrorKind::UnknownSymbol, i))
}
},
};
i = self.parse_ws(j, true)?;
}
continue;
}
if let Some(j) = self.lookahead_is("%expect", i) {
i = self.parse_ws(j, false)?;
let (j, n) = self.parse_int(i)?;
let span = Span::new(i, j);
if let Some((_, orig_span)) = self.ast.expect {
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateExpectDeclaration,
orig_span,
span,
);
} else {
self.ast.expect = Some((n, span));
}
i = self.parse_ws(j, true)?;
continue;
}
if let Some(j) = self.lookahead_is("%avoid_insert", i) {
i = self.parse_ws(j, false)?;
let num_newlines = self.num_newlines;
if self.ast.avoid_insert.is_none() {
self.ast.avoid_insert = Some(HashMap::new());
}
while j < self.src.len() && self.num_newlines == num_newlines {
let (j, n, span) = self.parse_token(i)?;
if self.ast.tokens.insert(n.clone()) {
self.ast.spans.push(span);
}
match self.ast.avoid_insert.as_mut().unwrap().entry(n) {
Entry::Occupied(occupied) => {
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration,
*occupied.get(),
span,
);
}
Entry::Vacant(vacant) => {
vacant.insert(span);
}
}
i = self.parse_ws(j, true)?;
}
continue;
}
if let Some(j) = self.lookahead_is("%parse-param", i) {
i = self.parse_ws(j, false)?;
let (j, name) = self.parse_to_single_colon(i)?;
match self.lookahead_is(":", j) {
Some(j) => i = self.parse_ws(j, false)?,
None => {
return Err(self.mk_error(YaccGrammarErrorKind::MissingColon, j));
}
}
let (j, ty) = self.parse_to_eol(i)?;
self.ast.parse_param = Some((name, ty));
i = self.parse_ws(j, true)?;
continue;
}
if let Some(YaccKind::Eco) = self.yacc_kind {
if let Some(j) = self.lookahead_is("%implicit_tokens", i) {
i = self.parse_ws(j, false)?;
let num_newlines = self.num_newlines;
if self.ast.implicit_tokens.is_none() {
self.ast.implicit_tokens = Some(HashMap::new());
}
while j < self.src.len() && self.num_newlines == num_newlines {
let (j, n, span) = self.parse_token(i)?;
if self.ast.tokens.insert(n.clone()) {
self.ast.spans.push(span);
}
match self.ast.implicit_tokens.as_mut().unwrap().entry(n) {
Entry::Occupied(entry) => {
let orig_span = *entry.get();
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration,
orig_span,
span,
);
}
Entry::Vacant(entry) => {
entry.insert(span);
}
}
i = self.parse_ws(j, true)?;
}
continue;
}
}
{
let k;
let kind;
if let Some(j) = self.lookahead_is("%left", i) {
kind = AssocKind::Left;
k = j;
} else if let Some(j) = self.lookahead_is("%right", i) {
kind = AssocKind::Right;
k = j;
} else if let Some(j) = self.lookahead_is("%nonassoc", i) {
kind = AssocKind::Nonassoc;
k = j;
} else {
return Err(self.mk_error(YaccGrammarErrorKind::UnknownDeclaration, i));
}
i = self.parse_ws(k, false)?;
let num_newlines = self.num_newlines;
while i < self.src.len() && num_newlines == self.num_newlines {
let (j, n, span) = self.parse_token(i)?;
match self.ast.precs.entry(n) {
Entry::Occupied(orig) => {
let (_, orig_span) = orig.get();
add_duplicate_occurrence(
errs,
YaccGrammarErrorKind::DuplicatePrecedence,
*orig_span,
span,
);
}
Entry::Vacant(entry) => {
let prec = Precedence {
level: prec_level,
kind,
};
entry.insert((prec, span));
}
}
i = self.parse_ws(j, true)?;
}
prec_level += 1;
}
}
debug_assert!(i == self.src.len());
Err(self.mk_error(YaccGrammarErrorKind::PrematureEnd, i))
}
fn parse_rules(&mut self, mut i: usize) -> Result<usize, YaccGrammarError> {
i = self.lookahead_is("%%", i).unwrap();
i = self.parse_ws(i, true)?;
while i < self.src.len() && self.lookahead_is("%%", i).is_none() {
i = self.parse_rule(i)?;
i = self.parse_ws(i, true)?;
}
Ok(i)
}
fn parse_rule(&mut self, mut i: usize) -> Result<usize, YaccGrammarError> {
let (j, rn) = self.parse_name(i)?;
let span = Span::new(i, j);
if self.ast.start.is_none() {
self.ast.start = Some((rn.clone(), span));
}
match self.yacc_kind {
None => unreachable!("Concrete YaccKind resolved at this point"),
Some(YaccKind::Original(_)) | Some(YaccKind::Eco) => {
if self.ast.get_rule(&rn).is_none() {
self.ast.add_rule(
(rn.clone(), span),
self.global_actiontype.clone().map(|(s, _)| s),
);
}
i = j;
}
Some(YaccKind::Grmtools) => {
i = self.parse_ws(j, true)?;
if let Some(j) = self.lookahead_is("->", i) {
i = j;
} else {
return Err(self.mk_error(YaccGrammarErrorKind::MissingRightArrow, i));
}
i = self.parse_ws(i, true)?;
let (j, actiont) = self.parse_to_single_colon(i)?;
if self.ast.get_rule(&rn).is_none() {
self.ast.add_rule((rn.clone(), span), Some(actiont));
}
i = j;
}
}
i = self.parse_ws(i, true)?;
match self.lookahead_is(":", i) {
Some(j) => i = j,
None => {
return Err(self.mk_error(YaccGrammarErrorKind::MissingColon, i));
}
}
let mut syms = Vec::new();
let mut prec = None;
let mut action = None;
i = self.parse_ws(i, true)?;
let mut pos_prod_start = i;
let mut pos_prod_end = None;
while i < self.src.len() {
if let Some(j) = self.lookahead_is("|", i) {
self.ast.add_prod(
rn.clone(),
syms,
prec,
action,
Span::new(pos_prod_start, pos_prod_end.take().unwrap_or(i)),
);
syms = Vec::new();
prec = None;
action = None;
i = self.parse_ws(j, true)?;
pos_prod_start = i;
continue;
} else if let Some(j) = self.lookahead_is(";", i) {
self.ast.add_prod(
rn,
syms,
prec,
action,
Span::new(pos_prod_start, pos_prod_end.take().unwrap_or(i)),
);
return Ok(j);
}
if self.lookahead_is("\"", i).is_some() || self.lookahead_is("'", i).is_some() {
let (j, sym, span) = self.parse_token(i)?;
pos_prod_end = Some(j);
i = self.parse_ws(j, true)?;
if self.ast.tokens.insert(sym.clone()) {
self.ast.spans.push(span);
}
syms.push(Symbol::Token(sym, span));
} else if let Some(j) = self.lookahead_is("%prec", i) {
i = self.parse_ws(j, true)?;
let (k, sym, span) = self.parse_token(i)?;
if self.ast.tokens.insert(sym.clone()) {
self.ast.spans.push(span);
}
prec = Some(sym);
pos_prod_end = Some(k);
i = k;
} else if self.lookahead_is("{", i).is_some() {
pos_prod_end = Some(i);
let (j, a) = self.parse_action(i)?;
i = self.parse_ws(j, true)?;
action = Some(a);
if !(self.lookahead_is("|", i).is_some() || self.lookahead_is(";", i).is_some()) {
return Err(self.mk_error(YaccGrammarErrorKind::ProductionNotTerminated, i));
}
} else if let Some(j) = self.lookahead_is("%empty", i) {
let k = self.parse_ws(j, true)?;
if !syms.is_empty()
| !(self.lookahead_is("|", k).is_some()
|| self.lookahead_is(";", k).is_some()
|| self.lookahead_is("{", k).is_some()
|| self.lookahead_is("%prec", k).is_some())
{
return Err(self.mk_error(YaccGrammarErrorKind::NonEmptyProduction, i));
}
pos_prod_end = Some(j);
i = k;
} else {
let (j, sym, span) = self.parse_token(i)?;
pos_prod_end = Some(j);
if self.ast.tokens.contains(&sym) {
syms.push(Symbol::Token(sym, span));
} else {
syms.push(Symbol::Rule(sym, span));
}
i = j;
}
i = self.parse_ws(i, true)?;
}
Err(self.mk_error(YaccGrammarErrorKind::IncompleteRule, i))
}
fn parse_name(&self, i: usize) -> Result<(usize, String), YaccGrammarError> {
match RE_NAME.find(&self.src[i..]) {
Some(m) => {
assert_eq!(m.start(), 0);
Ok((i + m.end(), self.src[i..i + m.end()].to_string()))
}
None => Err(self.mk_error(YaccGrammarErrorKind::IllegalName, i)),
}
}
fn parse_token(&self, i: usize) -> Result<(usize, String, Span), YaccGrammarError> {
match RE_TOKEN.find(&self.src[i..]) {
Some(m) => {
assert!(m.start() == 0 && m.end() > 0);
match self.src[i..].chars().next().unwrap() {
'"' | '\'' => {
debug_assert!('"'.len_utf8() == 1 && '\''.len_utf8() == 1);
let start_cidx = i + 1;
let end_cidx = i + m.end() - 1;
Ok((
i + m.end(),
self.src[start_cidx..end_cidx].to_string(),
Span::new(start_cidx, end_cidx),
))
}
_ => Ok((
i + m.end(),
self.src[i..i + m.end()].to_string(),
Span::new(i, i + m.end()),
)),
}
}
None => Err(self.mk_error(YaccGrammarErrorKind::IllegalString, i)),
}
}
fn parse_action(&mut self, i: usize) -> Result<(usize, String), YaccGrammarError> {
debug_assert!(self.lookahead_is("{", i).is_some());
let mut j = i;
let mut c = 0; while j < self.src.len() {
let ch = self.src[j..].chars().next().unwrap();
match ch {
'{' => c += 1,
'}' if c == 1 => {
c = 0;
break;
}
'}' => c -= 1,
'\n' | '\r' => {
self.num_newlines += 1;
}
_ => (),
};
j += ch.len_utf8();
}
if c > 0 {
Err(self.mk_error(YaccGrammarErrorKind::IncompleteAction, i))
} else {
debug_assert!(self.lookahead_is("}", j).is_some());
let s = self.src[i + '{'.len_utf8()..j].trim().to_string();
Ok((j + '}'.len_utf8(), s))
}
}
fn parse_programs(
&mut self,
mut i: usize,
_: &mut Vec<YaccGrammarError>,
) -> Result<usize, YaccGrammarError> {
if let Some(j) = self.lookahead_is("%%", i) {
i = self.parse_ws(j, true)?;
let prog = self.src[i..].to_string();
i += prog.len();
self.ast.set_programs(prog);
}
Ok(i)
}
fn parse_to_eol(&mut self, i: usize) -> Result<(usize, String), YaccGrammarError> {
let mut j = i;
while j < self.src.len() {
let c = self.src[j..].chars().next().unwrap();
match c {
'\n' | '\r' => break,
_ => j += c.len_utf8(),
}
}
Ok((j, self.src[i..j].to_string()))
}
fn parse_to_single_colon(&mut self, i: usize) -> Result<(usize, String), YaccGrammarError> {
let mut j = i;
while j < self.src.len() {
let c = self.src[j..].chars().next().unwrap();
match c {
':' => {
let k = j + ':'.len_utf8();
if k == self.src.len() || !self.src[k..].starts_with(':') {
return Ok((j, self.src[i..j].trim().to_string()));
}
j += 2 * ':'.len_utf8();
}
'\n' | '\r' => {
self.num_newlines += 1;
j += c.len_utf8();
}
_ => j += c.len_utf8(),
}
}
Err(self.mk_error(YaccGrammarErrorKind::ReachedEOL, j))
}
fn parse_int<T: FromStr + PrimInt>(
&mut self,
i: usize,
) -> Result<(usize, T), YaccGrammarError> {
let mut j = i;
while j < self.src.len() {
let c = self.src[j..].chars().next().unwrap();
match c {
'0' | '1' | '2' | '3' | '4' | '5' | '6' | '7' | '8' | '9' => j += 1,
_ => break,
}
}
match self.src[i..j].parse::<T>() {
Ok(x) => Ok((j, x)),
Err(_) => Err(self.mk_error(YaccGrammarErrorKind::IllegalInteger, i)),
}
}
fn parse_string(&mut self, mut i: usize) -> Result<(usize, String), YaccGrammarError> {
let qc = if self.lookahead_is("'", i).is_some() {
'\''
} else if self.lookahead_is("\"", i).is_some() {
'"'
} else {
return Err(self.mk_error(YaccGrammarErrorKind::InvalidString, i));
};
debug_assert!('"'.len_utf8() == 1 && '\''.len_utf8() == 1);
let mut s = String::new();
i += 1;
let mut j = i;
while j < self.src.len() {
let c = self.src[j..].chars().next().unwrap();
match c {
'\n' | '\r' => {
return Err(self.mk_error(YaccGrammarErrorKind::InvalidString, j));
}
x if x == qc => {
s.push_str(&self.src[i..j]);
return Ok((j + 1, s));
}
'\\' => {
debug_assert!('\\'.len_utf8() == 1);
match self.src[j + 1..].chars().next() {
Some(c) if c == '\'' || c == '"' => {
s.push_str(&self.src[i..j]);
i = j + 1;
j += 2;
}
_ => {
return Err(self.mk_error(YaccGrammarErrorKind::InvalidString, j));
}
}
}
_ => j += c.len_utf8(),
}
}
Err(self.mk_error(YaccGrammarErrorKind::InvalidString, j))
}
fn parse_ws(&mut self, mut i: usize, inc_newlines: bool) -> Result<usize, YaccGrammarError> {
while i < self.src.len() {
let c = self.src[i..].chars().next().unwrap();
match c {
' ' | '\t' => i += c.len_utf8(),
'\n' | '\r' => {
if !inc_newlines {
return Err(self.mk_error(YaccGrammarErrorKind::ReachedEOL, i));
}
self.num_newlines += 1;
i += c.len_utf8();
}
'/' => {
if i + c.len_utf8() == self.src.len() {
break;
} else {
let j = i + c.len_utf8();
let c = self.src[j..].chars().next().unwrap();
match c {
'/' => {
i = j + c.len_utf8();
for c in self.src[i..].chars() {
i += c.len_utf8();
if c == '\n' || c == '\r' {
self.num_newlines += 1;
break;
}
}
}
'*' => {
let mut k = j + c.len_utf8();
let mut found = false;
while k < self.src.len() {
let c = self.src[k..].chars().next().unwrap();
k += c.len_utf8();
match c {
'\n' | '\r' => {
if !inc_newlines {
return Err(self.mk_error(
YaccGrammarErrorKind::ReachedEOL,
i,
));
}
self.num_newlines += 1;
}
'*' => (),
_ => continue,
}
if k < self.src.len() {
let c = self.src[k..].chars().next().unwrap();
if c == '/' {
i = k + c.len_utf8();
found = true;
break;
}
}
}
if !found {
return Err(
self.mk_error(YaccGrammarErrorKind::IncompleteComment, i)
);
}
}
_ => break,
}
}
}
_ => break,
}
}
Ok(i)
}
fn lookahead_is(&self, s: &'static str, i: usize) -> Option<usize> {
if self.src[i..].starts_with(s) {
Some(i + s.len())
} else {
None
}
}
fn mk_error(&self, k: YaccGrammarErrorKind, off: usize) -> YaccGrammarError {
let span = Span::new(off, off);
YaccGrammarError {
kind: k,
spans: vec![span],
}
}
}
#[cfg(test)]
mod test {
use super::{
super::{
ast::{GrammarAST, Production, Symbol},
AssocKind, Precedence, YaccKind, YaccKindResolver, YaccOriginalActionKind,
},
Span, Spanned, YaccGrammarError, YaccGrammarErrorKind, YaccParser,
};
use std::collections::HashSet;
fn parse(yacc_kind: YaccKind, s: &str) -> Result<GrammarAST, Vec<YaccGrammarError>> {
let mut yp = YaccParser::new(YaccKindResolver::Force(yacc_kind), s.to_string());
yp.parse()?;
Ok(yp.build().1)
}
fn rule(n: &str) -> Symbol {
Symbol::Rule(n.to_string(), Span::new(0, 0))
}
fn rule_span(n: &str, span: Span) -> Symbol {
Symbol::Rule(n.to_string(), span)
}
fn token(n: &str) -> Symbol {
Symbol::Token(n.to_string(), Span::new(0, 0))
}
fn token_span(n: &str, span: Span) -> Symbol {
Symbol::Token(n.to_string(), span)
}
fn line_of_offset(s: &str, off: usize) -> usize {
s[..off].lines().count()
}
macro_rules! line_col {
($src:ident, $span: expr) => {{
let mut line_cache = crate::newlinecache::NewlineCache::new();
line_cache.feed(&$src);
line_cache
.byte_to_line_num_and_col_num(&$src, $span.start())
.unwrap()
}};
}
trait ErrorsHelper {
fn expect_error_at_line(self, src: &str, kind: YaccGrammarErrorKind, line: usize);
fn expect_error_at_line_col(
self,
src: &str,
kind: YaccGrammarErrorKind,
line: usize,
col: usize,
);
fn expect_error_at_lines_cols(
self,
src: &str,
kind: YaccGrammarErrorKind,
lines_cols: &mut dyn Iterator<Item = (usize, usize)>,
);
fn expect_multiple_errors(
self,
src: &str,
expected: &mut dyn Iterator<Item = (YaccGrammarErrorKind, Vec<(usize, usize)>)>,
);
}
impl ErrorsHelper for Result<GrammarAST, Vec<YaccGrammarError>> {
#[track_caller]
fn expect_error_at_line(self, src: &str, kind: YaccGrammarErrorKind, line: usize) {
let errs = self
.as_ref()
.map_err(Vec::as_slice)
.expect_err("Parsed ok while expecting error");
assert_eq!(errs.len(), 1);
let e = &errs[0];
assert_eq!(e.kind, kind);
assert_eq!(line_of_offset(src, e.spans()[0].start()), line);
assert_eq!(e.spans.len(), 1);
}
#[track_caller]
fn expect_error_at_line_col(
self,
src: &str,
kind: YaccGrammarErrorKind,
line: usize,
col: usize,
) {
self.expect_error_at_lines_cols(src, kind, &mut std::iter::once((line, col)))
}
#[track_caller]
fn expect_error_at_lines_cols(
self,
src: &str,
kind: YaccGrammarErrorKind,
lines_cols: &mut dyn Iterator<Item = (usize, usize)>,
) {
let errs = self
.as_ref()
.map_err(Vec::as_slice)
.expect_err("Parsed ok while expecting error");
assert_eq!(errs.len(), 1);
let e = &errs[0];
assert_eq!(e.kind, kind);
assert_eq!(
e.spans()
.iter()
.map(|span| line_col!(src, span))
.collect::<Vec<(usize, usize)>>(),
lines_cols.collect::<Vec<(usize, usize)>>()
);
for span in e.spans() {
let _ = &src[span.start()..span.end()];
}
}
#[track_caller]
fn expect_multiple_errors(
self,
src: &str,
expected: &mut dyn Iterator<Item = (YaccGrammarErrorKind, Vec<(usize, usize)>)>,
) {
let errs = self.expect_err("Parsed ok while expecting error");
for e in &errs {
for span in e.spans() {
let _ = &src[span.start()..span.end()];
}
}
assert_eq!(
errs.iter()
.map(|e| {
(
e.kind.clone(),
e.spans()
.iter()
.map(|span| line_col!(src, span))
.collect::<Vec<_>>(),
)
})
.collect::<Vec<_>>(),
expected.collect::<Vec<_>>()
);
}
}
#[test]
fn test_helper_fn() {
assert_eq!(Symbol::Token("A".to_string(), Span::new(0, 0)), token("A"));
}
#[test]
fn test_symbol_eq() {
assert_eq!(rule("A"), rule("A"));
assert_ne!(rule("A"), rule("B"));
assert_ne!(rule("A"), token("A"));
}
#[test]
fn test_rule() {
let src = "
%%
A : 'a';
"
.to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert_eq!(grm.get_rule("A").unwrap().pidxs, vec![0]);
let a_span = Span::new(33, 34);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("a", a_span)],
precedence: None,
action: None,
prod_span: Span::new(32, 35),
}
);
assert_eq!(&src[a_span.start()..a_span.end()], "a");
}
#[test]
fn test_rule_production_simple() {
let src = "
%%
A : 'a';
A : 'b';
"
.to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
let a_span = Span::new(33, 34);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("a", a_span)],
precedence: None,
action: None,
prod_span: Span::new(32, 35),
}
);
assert_eq!(&src[a_span.start()..a_span.end()], "a");
let b_span = Span::new(54, 55);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[1]],
Production {
symbols: vec![token_span("b", Span::new(54, 55))],
precedence: None,
action: None,
prod_span: Span::new(53, 56),
}
);
assert_eq!(&src[b_span.start()..b_span.end()], "b");
}
#[test]
fn test_rule_empty() {
let src = "
%%
A : ;
B : 'b' | ;
C : | 'c';
"
.to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![],
precedence: None,
action: None,
prod_span: Span::new(32, 32),
}
);
let b_span = Span::new(51, 52);
assert_eq!(
grm.prods[grm.get_rule("B").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("b", b_span)],
precedence: None,
action: None,
prod_span: Span::new(50, 53),
}
);
assert_eq!(&src[b_span.start()..b_span.end()], "b");
assert_eq!(
grm.prods[grm.get_rule("B").unwrap().pidxs[1]],
Production {
symbols: vec![],
precedence: None,
action: None,
prod_span: Span::new(56, 56),
}
);
assert_eq!(
grm.prods[grm.get_rule("C").unwrap().pidxs[0]],
Production {
symbols: vec![],
precedence: None,
action: None,
prod_span: Span::new(74, 74),
}
);
let c_span = Span::new(77, 78);
assert_eq!(
grm.prods[grm.get_rule("C").unwrap().pidxs[1]],
Production {
symbols: vec![token_span("c", c_span)],
precedence: None,
action: None,
prod_span: Span::new(76, 79),
}
);
assert_eq!(&src[c_span.start()..c_span.end()], "c");
}
#[test]
fn test_empty_program() {
let src = "%%\nA : 'a';\n%%".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
}
#[test]
fn test_multiple_symbols() {
let src = "%%\nA : 'a' B;".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
let a_span = Span::new(8, 9);
let b_span = Span::new(11, 12);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("a", a_span), rule_span("B", b_span)],
precedence: None,
action: None,
prod_span: Span::new(7, 12),
}
);
assert_eq!(&src[a_span.start()..a_span.end()], "a");
assert_eq!(&src[b_span.start()..b_span.end()], "B");
}
#[test]
fn test_token_types() {
let src = "%%\nA : 'a' \"b\";".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
let a_span = Span::new(8, 9);
let b_span = Span::new(12, 13);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("a", a_span), token_span("b", b_span)],
precedence: None,
action: None,
prod_span: Span::new(7, 14),
}
);
assert_eq!(&src[a_span.start()..a_span.end()], "a");
assert_eq!(&src[b_span.start()..b_span.end()], "b");
}
#[test]
fn test_declaration_start() {
let src = "%start A\n%%\nA : a;".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert_eq!(grm.start.unwrap(), ("A".to_string(), Span::new(9, 10)));
}
#[test]
fn test_declaration_token() {
let src = "%token a\n%%\nA : a;".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("a"));
}
#[test]
fn test_declaration_token_literal() {
let src = "%token 'a'\n%%\nA : 'a';".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("a"));
}
#[test]
fn test_declaration_tokens() {
let src = "%token a b c 'd'\n%%\nA : a;".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("a"));
assert!(grm.has_token("b"));
assert!(grm.has_token("c"));
}
#[test]
fn test_auto_add_tokens() {
let src = "%%\nA : 'a';".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("a"));
}
#[test]
fn test_token_non_literal() {
let src = "%token T %%\nA : T;".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("T"));
let t_span = Span::new(16, 17);
assert_eq!(
grm.prods[grm.get_rule("A").unwrap().pidxs[0]],
Production {
symbols: vec![token_span("T", t_span)],
precedence: None,
action: None,
prod_span: t_span,
}
);
assert_eq!(&src[t_span.start()..t_span.end() + 1], "T;");
}
#[test]
fn test_token_unicode() {
let src = "%token '❤' %%\nA : '❤';".to_string();
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.unwrap();
assert!(grm.has_token("❤"));
}
#[test]
fn test_unicode_err1() {
let src = "%token '❤' ❤;".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::IllegalString, 1, 12);
}
#[test]
fn test_unicode_err2() {
let src = "%token '❤'\n%%\nA : '❤' | ❤;".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::IllegalString, 3, 11);
}
#[test]
fn test_missing_end_quote() {
let src = "%epp X \"f\\".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::InvalidString, 1, 10);
}
#[test]
fn test_simple_decl_fail() {
let src = "%fail x\n%%\nA : a".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::UnknownDeclaration, 1, 1);
}
#[test]
fn test_empty() {
let src = "".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col("", YaccGrammarErrorKind::PrematureEnd, 1, 1);
}
#[test]
fn test_incomplete_rule1() {
let src = "%%A:".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::IncompleteRule, 1, 5);
}
#[test]
fn test_line_col_report1() {
let src = "%%
A:"
.to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::IncompleteRule, 2, 3);
}
#[test]
fn test_line_col_report2() {
let src = "%%
A:
"
.to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::IncompleteRule, 3, 1);
}
#[test]
fn test_line_col_report3() {
let src = "
%woo"
.to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::UnknownDeclaration, 3, 9);
}
#[test]
fn test_missing_colon() {
let src = "%%A x;".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::MissingColon, 1, 5);
}
#[test]
fn test_premature_end() {
let src = "%token x".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::PrematureEnd, 1, 9);
}
#[test]
fn test_premature_end_multibyte() {
let src = "%actiontype 🦀".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::PrematureEnd, 1, 14);
let src = "%parse-param c:🦀".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::PrematureEnd, 1, 17);
let src = "// 🦀".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::PrematureEnd, 1, 5);
}
#[test]
fn test_same_line() {
let src = "%token
x"
.to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::ReachedEOL, 1, 7);
}
#[test]
fn test_unknown_declaration() {
let src = "%woo".to_string();
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
&src,
)
.expect_error_at_line_col(&src, YaccGrammarErrorKind::UnknownDeclaration, 1, 1);
}
#[test]
fn test_grmtools_format() {
let src = "
%start A
%%
A -> T: 'b';
B -> Result<(), T>: 'c';
C -> ::std::result::Result<(), T>: 'd';
"
.to_string();
let grm = parse(YaccKind::Grmtools, &src).unwrap();
assert_eq!(grm.rules["A"].actiont, Some("T".to_string()));
assert_eq!(grm.rules["B"].actiont, Some("Result<(), T>".to_string()));
assert_eq!(
grm.rules["C"].actiont,
Some("::std::result::Result<(), T>".to_string())
);
}
#[test]
#[rustfmt::skip]
fn test_precs() {
let src = "
%left '+' '-'
%left '*'
%right '/'
%right '^'
%nonassoc '~'
%%
".to_string();
let grm = parse(YaccKind::Original(YaccOriginalActionKind::GenericParseTree), &src).unwrap();
assert_eq!(grm.precs.len(), 6);
assert_eq!(grm.precs["+"], (Precedence{level: 0, kind: AssocKind::Left}, Span::new(18, 19)));
assert_eq!(grm.precs["-"], (Precedence{level: 0, kind: AssocKind::Left}, Span::new(22, 23)));
assert_eq!(grm.precs["*"], (Precedence{level: 1, kind: AssocKind::Left}, Span::new(42, 43)));
assert_eq!(grm.precs["/"], (Precedence{level: 2, kind: AssocKind::Right}, Span::new(63, 64)));
assert_eq!(grm.precs["^"], (Precedence{level: 3, kind: AssocKind::Right}, Span::new(84, 85)));
assert_eq!(grm.precs["~"], (Precedence{level: 4, kind: AssocKind::Nonassoc}, Span::new(108, 109)));
}
#[test]
fn test_dup_precs() {
#[rustfmt::skip]
let srcs = vec![
("
%left 'x'
%left 'x'
%%
", ((2, 18), (3, 18))),
("
%left 'x'
%right 'x'
%%
", ((2, 18), (3, 19))),
("
%right 'x'
%right 'x'
%%
", ((2, 19), (3, 19))),
("
%nonassoc 'x'
%nonassoc 'x'
%%
", ((2, 22), (3, 22))),
("
%left 'x'
%nonassoc 'x'
%%
", ((2, 18), (3, 22))),
("
%right 'x'
%nonassoc 'x'
%%
", ((2, 19), (3, 22)))
];
for (src, (expected_origin, expected_dup)) in srcs.iter() {
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicatePrecedence,
&mut [*expected_origin, *expected_dup].into_iter(),
);
}
}
#[test]
fn test_multiple_dup_precs() {
let src = "
%left 'x'
%left 'x'
%right 'x'
%nonassoc 'x'
%left 'y'
%nonassoc 'y'
%right 'y'
%%";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicatePrecedence,
vec![(2, 18), (3, 18), (4, 19), (5, 22)],
),
(
YaccGrammarErrorKind::DuplicatePrecedence,
vec![(6, 18), (7, 22), (8, 19)],
),
]
.into_iter(),
);
}
#[test]
#[rustfmt::skip]
fn test_prec_override() {
let src = "
%left '+' '-'
%left '*' '/'
%%
expr : expr '+' expr
| expr '-' expr
| expr '*' expr
| expr '/' expr
| '-' expr %prec '*'
| NAME ;
";
let grm = parse(YaccKind::Original(YaccOriginalActionKind::GenericParseTree), src).unwrap();
assert_eq!(grm.precs.len(), 4);
assert_eq!(grm.prods[grm.rules["expr"].pidxs[0]].precedence, None);
assert_eq!(grm.prods[grm.rules["expr"].pidxs[3]].symbols.len(), 3);
assert_eq!(grm.prods[grm.rules["expr"].pidxs[4]].symbols.len(), 2);
assert_eq!(grm.prods[grm.rules["expr"].pidxs[4]].precedence, Some("*".to_string()));
}
#[test]
fn test_prec_empty() {
let src = "
%%
expr : 'a'
| %empty %prec 'a';
";
let grm = parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).unwrap();
assert_eq!(
grm.prods[grm.rules["expr"].pidxs[1]].precedence,
Some("a".to_string())
);
}
#[test]
fn test_bad_prec_overrides() {
let src = "
%%
S: 'A' %prec ;
";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::IllegalString, 3);
}
#[test]
fn test_parse_avoid_insert() {
let ast = parse(
YaccKind::Eco,
"
%avoid_insert ws1 ws2
%start R
%%
R: 'a';
",
)
.unwrap();
assert_eq!(
ast.avoid_insert,
Some(
[
("ws1".to_string(), Span::new(25, 28)),
("ws2".to_string(), Span::new(29, 32))
]
.iter()
.cloned()
.collect()
)
);
assert!(ast.tokens.get("ws1").is_some());
assert!(ast.tokens.get("ws2").is_some());
}
#[test]
fn test_multiple_avoid_insert() {
let ast = parse(
YaccKind::Eco,
"
%avoid_insert X
%avoid_insert Y
%%
",
)
.unwrap();
assert_eq!(
ast.avoid_insert,
Some(
[
("X".to_string(), Span::new(25, 26)),
("Y".to_string(), Span::new(51, 52))
]
.iter()
.cloned()
.collect()
)
);
}
#[test]
fn test_duplicate_avoid_insert() {
let src = "
%avoid_insert X Y
%avoid_insert Y
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration,
&mut [(2usize, 27usize), (3, 25)].into_iter(),
);
}
#[test]
fn test_duplicate_avoid_insert2() {
let src = "
%avoid_insert X
%avoid_insert Y Y
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration,
&mut [(3, 23), (3, 25)].into_iter(),
);
}
#[test]
fn test_multiple_duplicate_avoid_insert() {
let src = "
%avoid_insert X
%avoid_insert Y Y X
%%
";
parse(YaccKind::Eco, src).expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration,
vec![(3, 23), (3, 25)],
),
(
YaccGrammarErrorKind::DuplicateAvoidInsertDeclaration,
vec![(2, 23), (3, 27)],
),
]
.into_iter(),
);
}
#[test]
fn test_no_implicit_tokens_in_original_yacc() {
let src = "
%implicit_tokens X
%%
";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::UnknownDeclaration, 2);
}
#[test]
fn test_parse_implicit_tokens() {
let ast = parse(
YaccKind::Eco,
"
%implicit_tokens ws1 ws2
%start R
%%
R: 'a';
",
)
.unwrap();
assert_eq!(
ast.implicit_tokens,
Some(
[
("ws1".to_string(), Span::new(28, 31)),
("ws2".to_string(), Span::new(32, 35))
]
.iter()
.cloned()
.collect()
)
);
assert!(ast.tokens.get("ws1").is_some());
assert!(ast.tokens.get("ws2").is_some());
}
#[test]
fn test_multiple_implicit_tokens() {
let ast = parse(
YaccKind::Eco,
"
%implicit_tokens X
%implicit_tokens Y
%%
",
)
.unwrap();
assert_eq!(
ast.implicit_tokens,
Some(
[
("X".to_string(), Span::new(28, 29)),
("Y".to_string(), Span::new(57, 58))
]
.iter()
.cloned()
.collect()
)
);
}
#[test]
fn test_duplicate_implicit_tokens() {
let src = "
%implicit_tokens X
%implicit_tokens X Y
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration,
&mut [(2, 26), (3, 26)].into_iter(),
);
}
#[test]
fn test_duplicate_implicit_tokens2() {
let src = "
%implicit_tokens X X
%implicit_tokens Y
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration,
&mut [(2, 26), (2, 28)].into_iter(),
);
}
#[test]
fn test_multiple_duplicate_implicit_tokens_and_invalid_rule() {
let src = "
%implicit_tokens X
%implicit_tokens X Y
%implicit_tokens Y
%%
IncompleteRule: ";
parse(YaccKind::Eco, src).expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration,
vec![(2, 26), (3, 26)],
),
(
YaccGrammarErrorKind::DuplicateImplicitTokensDeclaration,
vec![(3, 28), (4, 26)],
),
(YaccGrammarErrorKind::IncompleteRule, vec![(6, 25)]),
]
.into_iter(),
);
}
#[test]
#[rustfmt::skip]
fn test_parse_epp() {
let ast = parse(
YaccKind::Eco,
r#"
%epp A "a"
%epp B 'a'
%epp C '"'
%epp D "'"
%epp E "\""
%epp F '\''
%epp G "a\"b"
%%
R: 'A';
"#,
)
.unwrap();
assert_eq!(ast.epp.len(), 7);
assert_eq!(ast.epp["A"], (Span::new(16, 17), ("a".to_string(), Span::new(18, 21))));
assert_eq!(ast.epp["B"], (Span::new(37, 38), ("a".to_string(), Span::new(39, 42))));
assert_eq!(ast.epp["C"], (Span::new(58, 59), ("\"".to_string(), Span::new(60, 63))));
assert_eq!(ast.epp["D"], (Span::new(79, 80), ("'".to_string(), Span::new(81, 84))));
assert_eq!(ast.epp["E"], (Span::new(100, 101), ("\"".to_string(), Span::new(102, 106))));
assert_eq!(ast.epp["F"], (Span::new(122, 123), ("'".to_string(), Span::new(124, 128))));
assert_eq!(ast.epp["G"], (Span::new(144, 145), ("a\"b".to_string(),Span::new(146, 152))));
}
#[test]
fn test_duplicate_epp() {
let src = "
%epp A \"a\"
%epp A \"a\"
%epp A \"a\"
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateEPP,
&mut [(2, 14), (3, 14), (4, 14)].into_iter(),
);
}
#[test]
fn test_multiple_duplicate_epp() {
let src = "
%epp A \"a1\"
%epp A \"a2\"
%epp A \"a3\"
%epp B \"b1\"
%epp B \"b2\"
%epp B \"b3\"
%%
";
parse(YaccKind::Eco, src).expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateEPP,
vec![(2, 14), (3, 14), (4, 14)],
),
(
YaccGrammarErrorKind::DuplicateEPP,
vec![(5, 14), (6, 14), (7, 14)],
),
]
.into_iter(),
);
}
#[test]
fn test_broken_string() {
let src = "
%epp A \"a
%%
";
parse(YaccKind::Eco, src).expect_error_at_line(src, YaccGrammarErrorKind::InvalidString, 2);
let src = "
%epp A \"a";
parse(YaccKind::Eco, src).expect_error_at_line(src, YaccGrammarErrorKind::InvalidString, 2);
}
#[test]
fn test_duplicate_start() {
let src = "
%start X
%start X
%%
";
parse(YaccKind::Eco, src).expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateStartDeclaration,
&mut [(2, 18), (3, 18)].into_iter(),
);
}
#[test]
fn test_duplicate_start_premature_end() {
let src = "
%start X
%start X";
parse(YaccKind::Eco, src).expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateStartDeclaration,
vec![(2, 18), (3, 18)],
),
(YaccGrammarErrorKind::PrematureEnd, vec![(3, 19)]),
]
.into_iter(),
);
}
#[test]
fn test_duplicate_expect() {
let src = "
%expect 1
%expect 2
%expect 3
%%
";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateExpectDeclaration,
&mut [(2, 19), (3, 19), (4, 19)].into_iter(),
)
}
#[test]
fn test_duplicate_expect_and_missing_colon() {
let src = "
%expect 1
%expect 2
%expect 3
%%
A ;";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateExpectDeclaration,
vec![(2, 19), (3, 19), (4, 19)],
),
(YaccGrammarErrorKind::MissingColon, vec![(6, 13)]),
]
.into_iter(),
)
}
#[test]
fn test_duplicate_expectrr() {
let src = "
%expect-rr 1
%expect-rr 2
%expect-rr 3
%%
";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateExpectRRDeclaration,
&mut [(2, 22), (3, 22), (4, 22)].into_iter(),
);
}
#[test]
fn test_duplicate_expectrr_illegal_name() {
let src = "
%expect-rr 1
%expect-rr 2
%expect-rr 3
%%
+IllegalRuleName+:;";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateExpectRRDeclaration,
vec![(2, 22), (3, 22), (4, 22)],
),
(YaccGrammarErrorKind::IllegalName, vec![(6, 11)]),
]
.into_iter(),
);
}
#[test]
fn test_implicit_start() {
let ast = parse(
YaccKind::Eco,
"
%%
R: ;
R2: ;
R3: ;
",
)
.unwrap();
assert_eq!(ast.start, Some(("R".to_string(), Span::new(24, 25))));
}
#[test]
fn test_action() {
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
"
%%
A: 'a' B { println!(\"test\"); }
;
B: 'b' 'c' { add($1, $2); }
| 'd'
;
D: 'd' {}
;
",
)
.unwrap();
assert_eq!(
grm.prods[grm.rules["A"].pidxs[0]].action,
Some("println!(\"test\");".to_string())
);
assert_eq!(
grm.prods[grm.rules["B"].pidxs[0]].action,
Some("add($1, $2);".to_string())
);
assert_eq!(grm.prods[grm.rules["B"].pidxs[1]].action, None);
}
#[test]
fn test_action_ends_in_multibyte() {
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
"%%A: '_' {(); // 🦀};",
)
.unwrap();
assert_eq!(
grm.prods[grm.rules["A"].pidxs[0]].action,
Some("(); // 🦀".to_string())
);
}
#[test]
fn test_programs() {
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
"
%%
A: 'a';
%%
fn foo() {}",
)
.unwrap();
assert_eq!(grm.programs, Some("fn foo() {}".to_string()));
}
#[test]
fn test_actions_with_newlines() {
let src = "
%%
A: 'a' { foo();
bar(); }
;
B: b';";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::IllegalString, 6);
}
#[test]
fn test_comments() {
let src = "
// A valid comment
%token a
/* Another valid comment */
%%\n
A : a;";
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.unwrap();
assert!(grm.has_token("a"));
let src = "
/* An invalid comment * /
%token a
%%\n
A : a;";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::IncompleteComment, 2);
let src = "
%token a
%%
/* A valid
* multi-line comment
*/
/* An invalid comment * /
A : a;";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::IncompleteComment, 7);
let src = "
%token a
%%
// Valid comment
A : a";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_line(src, YaccGrammarErrorKind::IncompleteRule, 5);
}
#[test]
fn test_action_type() {
let grm = parse(
YaccKind::Original(YaccOriginalActionKind::UserAction),
"
%actiontype T
%%
A: 'a';
%%
fn foo() {}",
)
.unwrap();
assert_eq!(grm.rules["A"].actiont, Some("T".to_string()));
}
#[test]
fn test_only_one_type() {
let src = "
%actiontype T1
%actiontype T2
%actiontype T3
%%
A: 'a';";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_error_at_lines_cols(
src,
YaccGrammarErrorKind::DuplicateActiontypeDeclaration,
&mut [(2, 22), (3, 22), (4, 22)].into_iter(),
);
}
#[test]
fn test_duplicate_actiontype_and_premature_end() {
let src = "
%actiontype T1
%actiontype T2
%actiontype T3";
parse(
YaccKind::Original(YaccOriginalActionKind::GenericParseTree),
src,
)
.expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateActiontypeDeclaration,
vec![(2, 22), (3, 22), (4, 22)],
),
(YaccGrammarErrorKind::PrematureEnd, vec![(4, 24)]),
]
.into_iter(),
)
}
#[test]
fn test_parse_param() {
let src = "
%parse-param a::b: (u64, u64)
%%
A: 'a';
";
let grm = parse(YaccKind::Original(YaccOriginalActionKind::UserAction), src).unwrap();
assert_eq!(
grm.parse_param,
Some(("a::b".to_owned(), "(u64, u64)".to_owned()))
);
}
#[test]
fn test_duplicate_rule() {
let ast = parse(
YaccKind::Grmtools,
"%token A B D
%%
Expr -> () : %empty | A;
Expr -> () : B | 'C';
Expr -> () : D;
",
)
.unwrap();
let expr_rule = ast.get_rule("Expr").unwrap();
let mut prod_names = HashSet::new();
for pidx in &expr_rule.pidxs {
for sym in &ast.prods[*pidx].symbols {
let name = match sym {
Symbol::Token(name, _) | Symbol::Rule(name, _) => name.clone(),
};
prod_names.insert(name);
}
}
assert_eq!(ast.prods.len(), 5);
assert_eq!(
prod_names,
HashSet::from_iter(["A", "B", "C", "D"].map(|s| s.to_owned()))
);
}
#[test]
fn test_duplicate_start_and_missing_arrow() {
let src = "%start A
%start A
%start A
%%
A -> () : 'a1';
B";
parse(YaccKind::Grmtools, src).expect_multiple_errors(
src,
&mut [
(
YaccGrammarErrorKind::DuplicateStartDeclaration,
vec![(1, 8), (2, 8), (3, 8)],
),
(YaccGrammarErrorKind::MissingRightArrow, vec![(6, 2)]),
]
.into_iter(),
)
}
#[test]
fn test_routines_multiple_errors() {
let mut src = String::from(
"
%start A
%start B
%expect 1
%expect 2
%%
A -> () : 'a';
%%
",
);
let mut expected_errs = vec![
(
YaccGrammarErrorKind::DuplicateStartDeclaration,
vec![(2, 16), (3, 16)],
),
(
YaccGrammarErrorKind::DuplicateExpectDeclaration,
vec![(4, 17), (5, 17)],
),
];
parse(YaccKind::Grmtools, &src)
.expect_multiple_errors(&src, &mut expected_errs.clone().into_iter());
src.push_str(
"
/* Incomplete comment
",
);
expected_errs.push((YaccGrammarErrorKind::IncompleteComment, vec![(10, 17)]));
parse(YaccKind::Grmtools, &src)
.expect_multiple_errors(&src, &mut expected_errs.clone().into_iter());
}
#[test]
fn test_expect_unused() {
let src = r#"
%expect-unused A 'b' "c"
%%
A: ;
"#;
let grm = parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).unwrap();
assert!(grm
.expect_unused
.contains(&Symbol::Rule("A".to_string(), Span::new(24, 25))));
assert!(grm
.expect_unused
.contains(&Symbol::Token("b".to_string(), Span::new(27, 28))));
assert!(grm
.expect_unused
.contains(&Symbol::Token("c".to_string(), Span::new(31, 32))));
}
#[test]
fn test_bad_expect_unused() {
let src = "
%expect-unused %
%%
A: ;
";
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).expect_error_at_line_col(
src,
YaccGrammarErrorKind::UnknownDeclaration,
2,
24,
);
}
#[test]
fn test_unused_symbols() {
let ast = parse(
YaccKind::Original(YaccOriginalActionKind::NoAction),
"
%expect-unused UnusedAllowed 'b'
%token a b
%start Start
%%
Unused: ;
Start: ;
UnusedAllowed: ;
",
)
.unwrap();
assert_eq!(
ast.unused_symbols()
.map(|sym_idx| { sym_idx.symbol(&ast) })
.collect::<Vec<Symbol>>()
.as_slice(),
&[
Symbol::Rule("Unused".to_string(), Span::new(101, 107)),
Symbol::Token("a".to_string(), Span::new(57, 58))
]
);
let ast = parse(
YaccKind::Original(YaccOriginalActionKind::NoAction),
"
%start A
%%
A: ;
Rec: Rec | ;
",
)
.unwrap();
assert_eq!(
ast.unused_symbols()
.map(|sym_idx| sym_idx.symbol(&ast))
.collect::<Vec<Symbol>>()
.as_slice(),
&[Symbol::Rule("Rec".to_string(), Span::new(50, 53))]
);
let ast = parse(
YaccKind::Original(YaccOriginalActionKind::NoAction),
"
%%
A: 'a' | 'z' ;
B: 'a' | 'c' ;
",
)
.unwrap();
assert_eq!(
ast.unused_symbols()
.map(|sym_idx| sym_idx.symbol(&ast))
.collect::<Vec<Symbol>>()
.as_slice(),
&[
Symbol::Rule("B".to_string(), Span::new(43, 44)),
Symbol::Token("c".to_string(), Span::new(53, 54))
]
);
}
#[test]
fn test_percent_empty() {
parse(
YaccKind::Original(YaccOriginalActionKind::NoAction),
r#"
%token a
%start A
%%
A: %empty | "a";
"#,
)
.unwrap();
let src = r#"
%token a b
%start A
%%
A: "a" | %empty | "b";
B: %empty | "b";
"#;
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).unwrap();
let src = r#"
%token a
%start A
%%
A: %empty "a";
"#;
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).expect_error_at_line_col(
src,
YaccGrammarErrorKind::NonEmptyProduction,
5,
12,
);
let src = r#"
%token a
%start A
%%
A: "a" %empty;
"#;
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).expect_error_at_line_col(
src,
YaccGrammarErrorKind::NonEmptyProduction,
5,
16,
);
}
#[test]
fn test_action_successor() {
let src = "
%%
A: B {} B;
B: ;
";
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).expect_error_at_line_col(
src,
YaccGrammarErrorKind::ProductionNotTerminated,
3,
17,
);
let src = "
%%
A: B B {};
B: {} ;
";
parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).unwrap();
}
#[test]
fn test_grmtools_section_yacckinds() {
let srcs = [
"%grmtools{yacckind: Original(NoAction)}
%%
Start: ;",
"%grmtools{yacckind: YaccKind::Original(GenericParseTree)}
%%
Start: ;",
"%grmtools{yacckind: YaccKind::Original(yaccoriginalactionkind::useraction)}
%actiontype ()
%%
Start: ;",
"%grmtools{yacckind: Original(YACCOriginalActionKind::NoAction)}
%%
Start: ;",
"%grmtools{yacckind: YaccKind::Grmtools}
%%
Start -> () : ;",
];
for src in srcs {
YaccParser::new(YaccKindResolver::NoDefault, src.to_string())
.parse()
.unwrap();
}
}
#[test]
fn test_grmtools_section_invalid_yacckinds() {
let srcs = [
"%grmtools{yacckind: Foo}",
"%grmtools{yacckind: YaccKind::Foo}",
"%grmtools{yacckindof: YaccKind::Grmtools}",
"%grmtools{yacckindof: Grmtools}",
"%grmtools{yacckindof: YaccKindFoo::Foo}",
"%grmtools{yacckind: Foo::Grmtools}",
"%grmtools{yacckind: YaccKind::Original}",
"%grmtools{yacckind: YaccKind::OriginalFoo}",
"%grmtools{yacckind: YaccKind::Original()}",
"%grmtools{yacckind: YaccKind::Original(Foo)}",
"%grmtools{yacckind: YaccKind::Original(YaccOriginalActionKind)}",
"%grmtools{yacckind: YaccKind::Original(YaccOriginalActionKind::Foo)}",
"%grmtools{yacckind: YaccKind::Original(Foo::NoActions)}",
"%grmtools{yacckind: YaccKind::Original(Foo::NoActionsBar)}",
];
for src in srcs {
let s = format!("{}\n%%\nStart();\n", src);
let parse_result = YaccParser::new(YaccKindResolver::NoDefault, s.to_string()).parse();
assert!(parse_result.is_err());
}
}
#[test]
fn test_grmtools_section_commas() {
let src = r#"
%grmtools{
yacckind: YaccKind::Grmtools,
}
%%
Start -> () : ;
"#;
YaccParser::new(YaccKindResolver::NoDefault, src.to_string())
.parse()
.unwrap();
let src = r#"
%grmtools{
yacckind: YaccKind::Grmtools
}
%%
Start -> () : ;
"#;
YaccParser::new(YaccKindResolver::NoDefault, src.to_string())
.parse()
.unwrap();
}
#[test]
fn test_empty_production_spans_issue_473() {
let empty_prod_conflicts = [
(
"%start Expr
%%
Expr: %empty | Factor;
Factor: ')' Expr ')';
",
(0, Span::new(21, 27)),
),
(
"%start Expr
%%
Expr: | Factor;
Factor: ')' Expr ')';
",
(0, Span::new(21, 21)),
),
(
"%start Expr
%%
Expr:| Factor;
Factor: ')' Expr ')';
",
(0, Span::new(20, 20)),
),
(
"%start Expr
%%
Expr: Factor | %empty;
Factor: ')' Expr ')';
",
(1, Span::new(30, 36)),
),
(
"%start Expr
%%
Expr: Factor | ;
Factor: ')' Expr ')';
",
(1, Span::new(30, 30)),
),
(
"%start Expr
%%
Expr: Factor|;
Factor: ')' Expr ')';
",
(1, Span::new(28, 28)),
),
];
for (i, (src, (empty_pidx, empty_span))) in empty_prod_conflicts.iter().enumerate() {
eprintln!("{}", i);
let ast = parse(YaccKind::Original(YaccOriginalActionKind::NoAction), src).unwrap();
assert_eq!(
ast.prods[ast.get_rule("Expr").unwrap().pidxs[*empty_pidx]],
Production {
symbols: vec![],
precedence: None,
action: None,
prod_span: *empty_span,
}
);
}
}
}