Simplify parsing by assuming the token stream will never be exhausted.

This commit is contained in:
Stephen Chung 2020-04-23 13:24:24 +08:00
parent a4bf572d5a
commit 5aaaa7be3b
3 changed files with 91 additions and 103 deletions

View File

@ -178,7 +178,7 @@ fn optimize_stmt<'a>(stmt: Stmt, state: &mut State<'a>, preserve_result: bool) -
Box::new(optimize_expr(expr, state)), Box::new(optimize_expr(expr, state)),
Box::new(optimize_stmt(*if_block, state, true)), Box::new(optimize_stmt(*if_block, state, true)),
match optimize_stmt(*else_block, state, true) { match optimize_stmt(*else_block, state, true) {
stmt if matches!(stmt, Stmt::Noop(_)) => None, // Noop -> no else block Stmt::Noop(_) => None, // Noop -> no else block
stmt => Some(Box::new(stmt)), stmt => Some(Box::new(stmt)),
}, },
), ),

View File

@ -508,19 +508,17 @@ impl Expr {
/// Consume a particular token, checking that it is the expected one. /// Consume a particular token, checking that it is the expected one.
fn eat_token(input: &mut Peekable<TokenIterator>, token: Token) -> Position { fn eat_token(input: &mut Peekable<TokenIterator>, token: Token) -> Position {
if let Some((t, pos)) = input.next() { let (t, pos) = input.next().unwrap();
if t != token {
panic!( if t != token {
"expecting {} (found {}) at {}", panic!(
token.syntax(), "expecting {} (found {}) at {}",
t.syntax(), token.syntax(),
pos t.syntax(),
); pos
} );
pos
} else {
panic!("expecting {} but already EOF", token.syntax());
} }
pos
} }
/// Match a particular token, consuming it if matched. /// Match a particular token, consuming it if matched.
@ -1269,103 +1267,91 @@ fn parse_binary_op<'a>(
return Ok(current_lhs); return Ok(current_lhs);
} }
if let Some((op_token, pos)) = input.next() { let (op_token, pos) = input.next().unwrap();
let rhs = parse_unary(input, allow_stmt_expr)?;
let next_precedence = if let Some((next_op, _)) = input.peek() { let rhs = parse_unary(input, allow_stmt_expr)?;
next_op.precedence()
} else {
0
};
// Bind to right if the next operator has higher precedence let next_precedence = input.peek().unwrap().0.precedence();
// If same precedence, then check if the operator binds right
let rhs = if (current_precedence == next_precedence && bind_right)
|| current_precedence < next_precedence
{
parse_binary_op(input, current_precedence, rhs, allow_stmt_expr)?
} else {
// Otherwise bind to left (even if next operator has the same precedence)
rhs
};
current_lhs = match op_token { // Bind to right if the next operator has higher precedence
Token::Plus => Expr::FunctionCall("+".into(), vec![current_lhs, rhs], None, pos), // If same precedence, then check if the operator binds right
Token::Minus => Expr::FunctionCall("-".into(), vec![current_lhs, rhs], None, pos), let rhs = if (current_precedence == next_precedence && bind_right)
Token::Multiply => { || current_precedence < next_precedence
Expr::FunctionCall("*".into(), vec![current_lhs, rhs], None, pos) {
} parse_binary_op(input, current_precedence, rhs, allow_stmt_expr)?
Token::Divide => Expr::FunctionCall("/".into(), vec![current_lhs, rhs], None, pos), } else {
// Otherwise bind to left (even if next operator has the same precedence)
rhs
};
Token::LeftShift => { current_lhs = match op_token {
Expr::FunctionCall("<<".into(), vec![current_lhs, rhs], None, pos) Token::Plus => Expr::FunctionCall("+".into(), vec![current_lhs, rhs], None, pos),
} Token::Minus => Expr::FunctionCall("-".into(), vec![current_lhs, rhs], None, pos),
Token::RightShift => { Token::Multiply => Expr::FunctionCall("*".into(), vec![current_lhs, rhs], None, pos),
Expr::FunctionCall(">>".into(), vec![current_lhs, rhs], None, pos) Token::Divide => Expr::FunctionCall("/".into(), vec![current_lhs, rhs], None, pos),
}
Token::Modulo => Expr::FunctionCall("%".into(), vec![current_lhs, rhs], None, pos),
Token::PowerOf => Expr::FunctionCall("~".into(), vec![current_lhs, rhs], None, pos),
// Comparison operators default to false when passed invalid operands Token::LeftShift => Expr::FunctionCall("<<".into(), vec![current_lhs, rhs], None, pos),
Token::EqualsTo => { Token::RightShift => Expr::FunctionCall(">>".into(), vec![current_lhs, rhs], None, pos),
Expr::FunctionCall("==".into(), vec![current_lhs, rhs], Some(false.into()), pos) Token::Modulo => Expr::FunctionCall("%".into(), vec![current_lhs, rhs], None, pos),
} Token::PowerOf => Expr::FunctionCall("~".into(), vec![current_lhs, rhs], None, pos),
Token::NotEqualsTo => {
Expr::FunctionCall("!=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::LessThan => {
Expr::FunctionCall("<".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::LessThanEqualsTo => {
Expr::FunctionCall("<=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::GreaterThan => {
Expr::FunctionCall(">".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::GreaterThanEqualsTo => {
Expr::FunctionCall(">=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::Or => Expr::Or(Box::new(current_lhs), Box::new(rhs), pos), // Comparison operators default to false when passed invalid operands
Token::And => Expr::And(Box::new(current_lhs), Box::new(rhs), pos), Token::EqualsTo => {
Token::Ampersand => { Expr::FunctionCall("==".into(), vec![current_lhs, rhs], Some(false.into()), pos)
Expr::FunctionCall("&".into(), vec![current_lhs, rhs], None, pos) }
} Token::NotEqualsTo => {
Token::Pipe => Expr::FunctionCall("|".into(), vec![current_lhs, rhs], None, pos), Expr::FunctionCall("!=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
Token::XOr => Expr::FunctionCall("^".into(), vec![current_lhs, rhs], None, pos), }
Token::LessThan => {
Expr::FunctionCall("<".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::LessThanEqualsTo => {
Expr::FunctionCall("<=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::GreaterThan => {
Expr::FunctionCall(">".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::GreaterThanEqualsTo => {
Expr::FunctionCall(">=".into(), vec![current_lhs, rhs], Some(false.into()), pos)
}
Token::In => parse_in_expr(current_lhs, rhs, pos)?, Token::Or => Expr::Or(Box::new(current_lhs), Box::new(rhs), pos),
Token::And => Expr::And(Box::new(current_lhs), Box::new(rhs), pos),
Token::Ampersand => Expr::FunctionCall("&".into(), vec![current_lhs, rhs], None, pos),
Token::Pipe => Expr::FunctionCall("|".into(), vec![current_lhs, rhs], None, pos),
Token::XOr => Expr::FunctionCall("^".into(), vec![current_lhs, rhs], None, pos),
#[cfg(not(feature = "no_object"))] Token::In => parse_in_expr(current_lhs, rhs, pos)?,
Token::Period => {
fn check_property(expr: Expr) -> Result<Expr, Box<ParseError>> { #[cfg(not(feature = "no_object"))]
match expr { Token::Period => {
// xxx.lhs.rhs fn check_property(expr: Expr) -> Result<Expr, Box<ParseError>> {
Expr::Dot(lhs, rhs, pos) => Ok(Expr::Dot( match expr {
Box::new(check_property(*lhs)?), // xxx.lhs.rhs
Box::new(check_property(*rhs)?), Expr::Dot(lhs, rhs, pos) => Ok(Expr::Dot(
pos, Box::new(check_property(*lhs)?),
)), Box::new(check_property(*rhs)?),
// xxx.lhs[idx] pos,
Expr::Index(lhs, idx, pos) => { )),
Ok(Expr::Index(Box::new(check_property(*lhs)?), idx, pos)) // xxx.lhs[idx]
} Expr::Index(lhs, idx, pos) => {
// xxx.id Ok(Expr::Index(Box::new(check_property(*lhs)?), idx, pos))
Expr::Variable(id, pos) => Ok(Expr::Property(id, pos)),
// xxx.prop
expr @ Expr::Property(_, _) => Ok(expr),
// xxx.fn()
expr @ Expr::FunctionCall(_, _, _, _) => Ok(expr),
expr => Err(PERR::PropertyExpected.into_err(expr.position())),
} }
// xxx.id
Expr::Variable(id, pos) => Ok(Expr::Property(id, pos)),
// xxx.prop
expr @ Expr::Property(_, _) => Ok(expr),
// xxx.fn()
expr @ Expr::FunctionCall(_, _, _, _) => Ok(expr),
expr => Err(PERR::PropertyExpected.into_err(expr.position())),
} }
Expr::Dot(Box::new(current_lhs), Box::new(check_property(rhs)?), pos)
} }
token => return Err(PERR::UnknownOperator(token.syntax().into()).into_err(pos)), Expr::Dot(Box::new(current_lhs), Box::new(check_property(rhs)?), pos)
}; }
}
token => return Err(PERR::UnknownOperator(token.syntax().into()).into_err(pos)),
};
} }
} }
@ -1439,7 +1425,7 @@ fn parse_if<'a>(
// if guard { if_body } else ... // if guard { if_body } else ...
let else_body = if match_token(input, Token::Else).unwrap_or(false) { let else_body = if match_token(input, Token::Else).unwrap_or(false) {
Some(Box::new(if matches!(input.peek(), Some((Token::If, _))) { Some(Box::new(if let (Token::If, _) = input.peek().unwrap() {
// if guard { if_body } else if ... // if guard { if_body } else if ...
parse_if(input, breakable, allow_stmt_expr)? parse_if(input, breakable, allow_stmt_expr)?
} else { } else {
@ -1676,9 +1662,9 @@ fn parse_stmt<'a>(
Token::Return | Token::Throw => { Token::Return | Token::Throw => {
let pos = *pos; let pos = *pos;
let return_type = match input.next() { let return_type = match input.next().unwrap() {
Some((Token::Return, _)) => ReturnType::Return, (Token::Return, _) => ReturnType::Return,
Some((Token::Throw, _)) => ReturnType::Exception, (Token::Throw, _) => ReturnType::Exception,
_ => panic!("token should be return or throw"), _ => panic!("token should be return or throw"),
}; };
@ -1819,7 +1805,7 @@ fn parse_global_level<'a>(
// Collect all the function definitions // Collect all the function definitions
#[cfg(not(feature = "no_function"))] #[cfg(not(feature = "no_function"))]
{ {
if matches!(input.peek().expect("should not be None"), (Token::Fn, _)) { if let (Token::Fn, _) = input.peek().unwrap() {
let f = parse_fn(input, true)?; let f = parse_fn(input, true)?;
functions.insert(calc_fn_def(&f.name, f.params.len()), f); functions.insert(calc_fn_def(&f.name, f.params.len()), f);
continue; continue;

View File

@ -991,6 +991,8 @@ impl<'a> TokenIterator<'a> {
} }
('~', _) => return Some((Token::PowerOf, pos)), ('~', _) => return Some((Token::PowerOf, pos)),
('\0', _) => panic!("should not be EOF"),
(ch, _) if ch.is_whitespace() => (), (ch, _) if ch.is_whitespace() => (),
(ch, _) => return Some((Token::LexError(Box::new(LERR::UnexpectedChar(ch))), pos)), (ch, _) => return Some((Token::LexError(Box::new(LERR::UnexpectedChar(ch))), pos)),
} }