glox/parser.go

629 lines
11 KiB
Go
Raw Permalink Normal View History

2024-10-03 22:12:40 +03:00
package main
import (
2024-10-14 22:53:26 +03:00
"errors"
2024-10-03 22:12:40 +03:00
"fmt"
)
type Parser struct {
tokens []Token
current int
2024-10-05 18:58:49 +03:00
errors []error
2024-10-03 22:12:40 +03:00
}
type ParseError struct {
token Token
message string
}
2024-10-05 18:58:49 +03:00
func (pe *ParseError) Error() string {
2024-11-02 18:23:58 +02:00
return fmt.Sprintf(
"ParseError [%d][%s]: %s",
pe.token.line,
pe.token.typ,
pe.message,
)
2024-10-03 22:12:40 +03:00
}
func newParser(tokens []Token) *Parser {
return &Parser{
tokens: tokens,
current: 0,
}
}
2024-10-05 18:58:49 +03:00
// program -> declaration* EOF
2024-10-14 22:53:26 +03:00
func (p *Parser) parse() ([]Stmt, error) {
2024-10-03 22:12:40 +03:00
defer p.recover()
2024-10-05 18:58:49 +03:00
stmts := []Stmt{}
for !p.isAtEnd() {
if stmt := p.declaration(); stmt != nil {
stmts = append(stmts, stmt)
}
}
2024-10-14 22:53:26 +03:00
return stmts, errors.Join(p.errors...)
2024-10-03 22:12:40 +03:00
}
2024-11-06 00:09:50 +02:00
// declaration ->
// varDecl | funDecl | classDecl | statement
2024-10-05 18:58:49 +03:00
func (p *Parser) declaration() Stmt {
defer p.synchronize()
if p.match(VAR) {
return p.varDecl()
2024-10-03 22:12:40 +03:00
}
2024-10-09 23:36:18 +03:00
if p.match(FUN) {
return p.function("function")
}
2024-11-06 00:09:50 +02:00
if p.match(CLASS) {
return p.classDecl()
}
2024-10-05 18:58:49 +03:00
return p.statement()
2024-10-03 22:12:40 +03:00
}
2024-10-05 18:58:49 +03:00
// varDecl -> "var" IDENTIFIER ("=" expression)? ";"
func (p *Parser) varDecl() Stmt {
2024-10-09 23:36:18 +03:00
name := p.consume(IDENTIFIER, "Expect identifier for variable")
2024-10-05 18:58:49 +03:00
var initializer Expr = nil
if p.match(EQUAL) {
initializer = p.expression()
}
p.consume(SEMICOLON, "Expect ';' after expression.")
return &VarStmt{name, initializer}
}
2024-11-06 00:09:50 +02:00
// classDecl -> "class" IDENTIFIER "{" function* "}"
func (p *Parser) classDecl() Stmt {
name := p.consume(IDENTIFIER, "Expect identifier for variable")
p.consume(LEFT_BRACE, "Expect '{' after class identifier")
methods := []FunStmt{}
for !p.isAtEnd() && !p.check(RIGHT_BRACE) {
methods = append(methods, *p.function("method"))
}
p.consume(RIGHT_BRACE, "Expect '}' after class definition")
return &ClassStmt{name, methods}
}
2024-10-09 23:36:18 +03:00
// funDecl -> "fun" function
// function -> IDENTIFIER "(" parameters? ")" blockStmt
// parameters -> IDENTIFIER ( "," IDENTIFIER )*
2024-11-06 00:09:50 +02:00
func (p *Parser) function(kind string) *FunStmt {
2024-10-09 23:36:18 +03:00
name := p.consume(IDENTIFIER, fmt.Sprintf("Expect %s name.", kind))
p.consume(LEFT_PAREN, fmt.Sprintf("Expect '(' after %s name.", kind))
args := []Token{}
for !p.check(RIGHT_PAREN) {
args = append(
args,
p.consume(
IDENTIFIER,
fmt.Sprintf("Expect %s argument.", kind),
),
)
if p.check(COMMA) {
p.advance()
}
}
p.consume(RIGHT_PAREN, fmt.Sprintf("Expect ')' after %s name.", kind))
p.consume(LEFT_BRACE, fmt.Sprintf("Expect '{' after %s arguments.", kind))
2024-10-14 22:53:26 +03:00
body := p.block()
2024-10-09 23:36:18 +03:00
return &FunStmt{name, args, body}
}
2024-10-07 21:06:23 +03:00
// statement -> exprStmt
//
// | whileStmt
2024-10-08 20:32:13 +03:00
// | forStmt
2024-10-07 21:06:23 +03:00
// | printStmt
// | blockStmt
2024-10-07 21:47:55 +03:00
// | breakStmt
2024-10-07 21:06:23 +03:00
// | ifStmt
2024-10-11 17:01:12 +03:00
// | returnStmt
2024-10-07 21:06:23 +03:00
// | env
2024-10-05 18:58:49 +03:00
func (p *Parser) statement() Stmt {
if p.match(PRINT) {
return p.printStmt()
}
2024-10-05 23:27:00 +03:00
if p.match(LEFT_BRACE) {
2024-10-07 21:06:23 +03:00
return p.blockStmt()
2024-10-05 23:27:00 +03:00
}
2024-10-06 16:30:57 +03:00
if p.match(IF) {
return p.ifStmt()
}
if p.match(ENV) {
return p.envStmt()
}
2024-10-07 21:06:23 +03:00
if p.match(WHILE) {
return p.whileStmt()
}
2024-10-08 20:32:13 +03:00
if p.match(FOR) {
return p.forStmt()
}
2024-10-07 21:47:55 +03:00
if p.match(BREAK) {
return p.breakStmt()
}
2024-10-11 17:01:12 +03:00
if p.match(RETURN) {
return p.returnStmt()
}
2024-10-05 18:58:49 +03:00
return p.exprStmt()
}
// exprStmt -> expression ";"
func (p *Parser) exprStmt() Stmt {
expr := p.expression()
p.consume(SEMICOLON, "Expect ';' after expression.")
2024-10-06 16:30:57 +03:00
if expr == nil {
return nil
}
2024-10-05 18:58:49 +03:00
return &ExprStmt{expr}
}
// printStmt -> "print" expression ";"
func (p *Parser) printStmt() Stmt {
expr := p.expression()
2024-10-06 16:30:57 +03:00
if expr == nil {
p.panic(&ParseError{p.previous(), "Expect expression after 'print'"})
}
2024-10-05 18:58:49 +03:00
p.consume(SEMICOLON, "Expect ';' after expression.")
return &PrintStmt{expr}
}
2024-10-14 22:53:26 +03:00
func (p *Parser) block() []Stmt {
2024-10-05 23:27:00 +03:00
stmts := []Stmt{}
2024-10-06 16:30:57 +03:00
for !p.check(RIGHT_BRACE) && !p.isAtEnd() {
2024-10-05 23:27:00 +03:00
stmts = append(stmts, p.declaration())
}
p.consume(RIGHT_BRACE, "Unclosed block: Expected '}'.")
2024-10-14 22:53:26 +03:00
return stmts
}
// blockStmt -> "{" statement* "}"
func (p *Parser) blockStmt() *BlockStmt {
return &BlockStmt{p.block()}
2024-10-05 23:27:00 +03:00
}
2024-10-07 21:47:55 +03:00
// breakStmt -> break ";"
func (p *Parser) breakStmt() Stmt {
p.consume(SEMICOLON, "Expect ';' after break.")
return &BreakStmt{}
}
2024-10-06 16:30:57 +03:00
// if -> "if" "(" expression ")" statement ("else" statement)?
func (p *Parser) ifStmt() Stmt {
name := p.previous()
p.consume(LEFT_PAREN, "Expect '(' after 'if'.")
expr := p.expression()
p.consume(RIGHT_PAREN, "Expect ')' after 'if' condition.")
then := p.statement()
var or Stmt = nil
if p.match(ELSE) {
or = p.statement()
}
return &IfStmt{name, expr, then, or}
2024-10-07 21:06:23 +03:00
}
// while -> "while" "(" expression ")" statement
func (p *Parser) whileStmt() Stmt {
p.consume(LEFT_PAREN, "Expect '(' after 'while'.")
cond := p.expression()
p.consume(RIGHT_PAREN, "Expect ')' after 'while' expression.")
body := p.statement()
return &WhileStmt{cond, body}
2024-10-06 16:30:57 +03:00
}
2024-10-08 20:32:13 +03:00
// for -> "for" ( "(" ( varDecl | exprStmt | ";" ) expression? ";" expression ")" )? statement
func (p *Parser) forStmt() Stmt {
if p.check(LEFT_BRACE) {
return &WhileStmt{&Literal{true}, p.statement()}
}
p.consume(LEFT_PAREN, "Expect '(' after 'for'.")
var init Stmt
if p.match(SEMICOLON) {
init = nil
} else if p.match(VAR) {
init = p.varDecl()
} else {
init = p.exprStmt()
}
var cond Expr
if !p.check(SEMICOLON) {
cond = p.expression()
}
p.consume(SEMICOLON, "Expect ';' after for loop condition;")
var incr Expr
if !p.check(RIGHT_PAREN) {
incr = p.expression()
}
p.consume(RIGHT_PAREN, "Expect ')' after for clauses;")
var body = p.statement()
if incr != nil {
body = &BlockStmt{[]Stmt{body, &ExprStmt{incr}}}
}
if cond == nil {
cond = &Literal{true}
}
body = &WhileStmt{cond, body}
if init != nil {
body = &BlockStmt{[]Stmt{init, body}}
}
return body
}
2024-10-06 16:30:57 +03:00
// env -> "env" ";"
func (p *Parser) envStmt() Stmt {
p.consume(SEMICOLON, "Expect ';' after 'env'.")
return &EnvStmt{}
}
2024-10-11 17:01:12 +03:00
// return -> "return" expression ";"
func (p *Parser) returnStmt() Stmt {
ret := p.expression()
p.consume(SEMICOLON, "Expect ';' after return;")
return &ReturnStmt{ret}
}
2024-10-05 18:58:49 +03:00
// expression -> assignment
2024-10-03 22:12:40 +03:00
func (p *Parser) expression() Expr {
2024-10-05 18:58:49 +03:00
return p.assignment()
}
2024-10-06 17:15:50 +03:00
// assignment -> IDENTIFIER "=" assignment | or
2024-10-05 18:58:49 +03:00
func (p *Parser) assignment() Expr {
2024-10-06 17:15:50 +03:00
expr := p.or()
2024-10-05 18:58:49 +03:00
if p.match(EQUAL) {
eq := p.previous()
val := p.assignment()
if variable, ok := expr.(*Variable); ok {
return &Assign{variable.name, val}
}
p.panic(&ParseError{eq, "Invalid assignment target."})
}
return expr
2024-10-03 22:12:40 +03:00
}
2024-10-06 17:15:50 +03:00
// or -> and ( "or" and )*
func (p *Parser) or() Expr {
left := p.and()
2024-10-06 16:30:57 +03:00
for p.match(OR) {
or := p.previous()
2024-10-06 17:15:50 +03:00
right := p.and()
left = &Logical{left, or, right}
2024-10-06 16:30:57 +03:00
}
return left
}
2024-10-06 17:15:50 +03:00
// and -> equality ( "and" equality )*
func (p *Parser) and() Expr {
2024-10-06 16:30:57 +03:00
left := p.equality()
for p.match(AND) {
or := p.previous()
right := p.equality()
2024-10-06 17:15:50 +03:00
left = &Logical{left, or, right}
2024-10-06 16:30:57 +03:00
}
return left
}
2024-10-03 22:12:40 +03:00
// equality -> comparison ( ( "==" | "!=" ) comparison )*
func (p *Parser) equality() Expr {
expr := p.comparison()
for p.match(EQUAL_EQUAL, BANG_EQUAL) {
op := p.previous()
right := p.comparison()
expr = &Binary{expr, op, right}
}
return expr
}
// comparison -> term ( ( ">" | ">=" | "<" | "<=" ) term )*
func (p *Parser) comparison() Expr {
expr := p.term()
for p.match(GREATER, GREATER_EQUAL, LESS, LESS_EQUAL) {
op := p.previous()
right := p.term()
expr = &Binary{expr, op, right}
}
return expr
}
// term -> factor ( ( "-" | "+" ) factor )*
func (p *Parser) term() Expr {
expr := p.factor()
for p.match(MINUS, PLUS) {
op := p.previous()
right := p.factor()
expr = &Binary{expr, op, right}
}
return expr
}
// factor -> unary ( ( "/" | "*" ) unary )*
func (p *Parser) factor() Expr {
exp := p.unary()
for p.match(SLASH, STAR) {
op := p.previous()
right := p.unary()
2024-10-04 15:24:01 +03:00
exp = &Binary{exp, op, right}
2024-10-03 22:12:40 +03:00
}
return exp
}
// unary -> ( "!" | "-" ) unary | primary
func (p *Parser) unary() Expr {
if p.match(BANG, MINUS) {
op := p.previous()
right := p.unary()
return &Unary{op, right}
}
2024-10-09 19:57:52 +03:00
return p.call()
}
// call -> primary ( "(" arguments? ")" )*
func (p *Parser) call() Expr {
expr := p.primary()
for {
if p.match(LEFT_PAREN) {
expr = p.arguments(expr)
} else {
break
}
}
return expr
}
// arguments -> expression ( "," expression )*
func (p *Parser) arguments(callee Expr) Expr {
arguments := []Expr{}
if !p.check(RIGHT_PAREN) {
for {
arguments = append(arguments, p.expression())
if !p.match(COMMA) {
break
}
}
}
paren := p.consume(RIGHT_PAREN, "Expect ')' after arguments.")
return &Call{callee, paren, arguments}
2024-10-03 22:12:40 +03:00
}
2024-10-12 14:48:27 +03:00
// primary -> IDENTIFIER
//
// | NUMBER
// | STRING
// | "true"
// | "false"
// | "nil"
// | "(" expression ")"
// | lambda
2024-10-03 22:12:40 +03:00
func (p *Parser) primary() Expr {
switch {
case p.match(FALSE):
return &Literal{false}
case p.match(TRUE):
return &Literal{true}
case p.match(NIL):
return &Literal{nil}
}
2024-10-12 14:48:27 +03:00
if p.match(FUN) {
return p.lambda()
}
2024-10-03 22:12:40 +03:00
if p.match(NUMBER, STRING) {
return &Literal{p.previous().literal}
}
2024-10-05 18:58:49 +03:00
if p.match(IDENTIFIER) {
return &Variable{p.previous()}
}
2024-10-03 22:12:40 +03:00
if p.match(LEFT_PAREN) {
expr := p.expression()
p.consume(RIGHT_PAREN, "Expect ')' after expression")
return &Grouping{expr}
}
2024-10-07 21:47:55 +03:00
p.panic(&ParseError{p.peek(), "Expect expression"})
2024-10-03 22:12:40 +03:00
return nil
}
2024-10-12 14:48:27 +03:00
func (p *Parser) lambda() Expr {
name := p.previous()
p.consume(LEFT_PAREN, "Expect '(' before lambda arguments.")
args := []Token{}
for !p.check(RIGHT_PAREN) {
args = append(
args,
p.consume(
IDENTIFIER,
"Expect lambda argument.",
),
)
if p.check(COMMA) {
p.advance()
}
}
p.consume(RIGHT_PAREN, "Expect ')' after lambda arguments.")
p.consume(LEFT_BRACE, "Expect '{' before lambda body.")
2024-10-14 22:53:26 +03:00
body := p.block()
2024-10-12 14:48:27 +03:00
return &Lambda{name, args, body}
}
2024-10-03 22:12:40 +03:00
func (p *Parser) previous() Token {
return p.tokens[p.current-1]
}
func (p *Parser) peek() Token {
return p.tokens[p.current]
}
func (p *Parser) isAtEnd() bool {
return p.peek().typ == EOF
}
func (p *Parser) advance() Token {
if !p.isAtEnd() {
p.current++
}
return p.previous()
}
func (p *Parser) check(typ TokenType) bool {
if p.isAtEnd() {
return false
}
return p.peek().typ == typ
}
func (p *Parser) match(types ...TokenType) bool {
for _, typ := range types {
if p.check(typ) {
p.advance()
return true
}
}
return false
}
func (p *Parser) consume(typ TokenType, mes string) Token {
if p.check(typ) {
return p.advance()
}
2024-10-05 18:58:49 +03:00
p.panic(&ParseError{p.peek(), mes})
2024-10-03 22:12:40 +03:00
return Token{}
}
func (p *Parser) synchronize() {
2024-10-05 18:58:49 +03:00
err := recover()
pe := p.isParseError(err)
if pe == nil {
return
}
2024-10-03 22:12:40 +03:00
p.advance()
for !p.isAtEnd() {
if p.previous().typ == SEMICOLON {
return
}
switch p.peek().typ {
2024-10-06 16:30:57 +03:00
case CLASS, FOR, FUN, IF, PRINT, RETURN, VAR, WHILE, ENV:
2024-10-03 22:12:40 +03:00
return
}
p.advance()
}
2024-10-05 18:58:49 +03:00
}
func (p *Parser) recover() {
p.isParseError(recover())
}
func (p *Parser) panic(pe *ParseError) {
p.errors = append(p.errors, pe)
panic(pe)
}
func (p *Parser) isParseError(err any) *ParseError {
if err == nil {
return nil
}
pe, ok := err.(*ParseError)
if !ok {
panic(err)
}
return pe
2024-10-03 22:12:40 +03:00
}