vig/src/parser.zig

526 lines
14 KiB
Zig
Raw Normal View History

2019-06-05 01:11:11 +00:00
const std = @import("std");
const scanners = @import("scanner.zig");
const main = @import("main.zig");
const ast = @import("ast.zig");
const tokens = @import("tokens.zig");
2019-06-06 01:06:12 +00:00
const err = @import("errors.zig");
2019-06-05 01:11:11 +00:00
const Allocator = std.mem.Allocator;
const Scanner = scanners.Scanner;
const Token = tokens.Token;
const TokenType = tokens.TokenType;
const Result = main.Result;
2019-08-24 01:13:26 +00:00
const Node = ast.Node;
2019-08-24 01:13:26 +00:00
const Expr = ast.Expr;
2019-08-24 19:00:22 +00:00
const Stmt = ast.Stmt;
2019-06-06 01:06:12 +00:00
2019-06-05 01:11:11 +00:00
pub const Parser = struct {
allocator: *Allocator,
scanner: *Scanner,
2019-06-06 01:06:12 +00:00
tokens: []Token = undefined,
2019-06-05 01:11:11 +00:00
2019-08-23 14:57:49 +00:00
hadError: bool = false,
2019-06-05 01:11:11 +00:00
pub fn init(allocator: *Allocator, scanner: *Scanner) Parser {
return Parser{ .allocator = allocator, .scanner = scanner };
}
2019-08-23 14:57:49 +00:00
fn doError(self: *Parser, comptime fmt: []const u8, args: ...) void {
self.hadError = true;
2019-06-05 01:11:11 +00:00
std.debug.warn("parser error at line {}\n\t", self.scanner.line);
std.debug.warn(fmt, args);
std.debug.warn("\n");
}
2019-06-06 01:06:12 +00:00
fn peek(self: *Parser) Token {
2019-07-01 18:39:48 +00:00
return self.tokens[self.tokens.len - 1];
2019-06-06 01:06:12 +00:00
}
fn previous(self: *Parser) Token {
2019-07-01 18:39:48 +00:00
return self.tokens[self.tokens.len - 2];
2019-06-06 01:06:12 +00:00
}
fn tokenError(self: *Parser, token: Token, msg: []const u8) Result!void {
if (token.ttype == .EOF) {
err.report(token.line, " at end", msg);
} else {
err.reportFmt(token.line, " at '{}': {}", token.lexeme, msg);
2019-06-05 01:11:11 +00:00
}
2019-06-06 01:06:12 +00:00
return Result.CompileError;
2019-06-05 01:11:11 +00:00
}
2019-06-06 01:06:12 +00:00
fn isAtEnd(self: *Parser) bool {
return self.peek().ttype == .EOF;
}
fn check(self: *Parser, ttype: TokenType) bool {
if (self.isAtEnd()) return false;
return self.peek().ttype == ttype;
}
2019-07-01 18:39:48 +00:00
fn nextToken(self: *Parser) !Token {
var token: Token = undefined;
while (true) {
var next_token_opt = try self.scanner.nextToken();
if (next_token_opt) |token_nice| {
token = token_nice;
break;
2019-06-06 01:06:12 +00:00
}
}
2019-07-01 18:39:48 +00:00
self.tokens = try self.allocator.realloc(
self.tokens,
self.tokens.len + 1,
);
2019-06-06 01:06:12 +00:00
2019-07-01 18:39:48 +00:00
self.tokens[self.tokens.len - 1] = token;
std.debug.warn("skip to {}\n", token);
2019-07-01 18:39:48 +00:00
return token;
2019-06-06 01:06:12 +00:00
}
2019-07-01 18:39:48 +00:00
fn consume(self: *Parser, ttype: TokenType, comptime msg: []const u8) !Token {
if (self.check(ttype)) return try self.nextToken();
2019-06-06 01:06:12 +00:00
try self.tokenError(self.peek(), msg);
return Result.CompileError;
2019-06-05 01:11:11 +00:00
}
2019-07-01 18:25:07 +00:00
fn consumeSingle(self: *Parser, ttype: TokenType) !Token {
2019-07-01 18:39:48 +00:00
if (self.check(ttype)) {
var cur = self.peek();
_ = try self.nextToken();
2019-08-24 14:07:23 +00:00
std.debug.warn("consumed {}, now has {}\n", ttype, self.peek());
2019-07-01 18:39:48 +00:00
return cur;
}
2019-07-01 18:25:07 +00:00
var buf_main: [1000]u8 = undefined;
var buf = try std.fmt.bufPrint(
buf_main[0..],
"expected {}, got {}",
ttype,
self.peek().ttype,
);
try self.tokenError(self.peek(), buf);
return Result.CompileError;
}
2019-08-24 01:13:26 +00:00
fn compareAnyOf(self: *@This(), ttypes: []TokenType) bool {
for (ttypes) |ttype| {
2019-08-24 14:07:23 +00:00
if (self.check(ttype)) return true;
2019-08-24 01:13:26 +00:00
}
return false;
}
2019-08-24 19:00:22 +00:00
fn mkFnDecl(self: *Parser, name: Token, params: ast.ParamList, block: ast.StmtList) !*ast.Node {
2019-07-01 18:25:07 +00:00
var node = try self.allocator.create(Node);
2019-07-01 18:55:19 +00:00
node.* = Node{
.FnDecl = ast.FnDecl{
.func_name = name,
.params = params,
2019-08-24 14:07:23 +00:00
.body = block,
2019-07-01 18:55:19 +00:00
},
};
return node;
2019-06-06 01:06:12 +00:00
}
fn mkConstDecl(self: *Parser, consts: ast.ConstList) !*ast.Node {
var node = try self.allocator.create(Node);
node.* = Node{ .ConstDecl = consts };
return node;
}
2019-07-01 18:55:19 +00:00
2019-08-24 19:00:22 +00:00
fn mkBlock(self: *Parser, stmts: ast.StmtList) !*ast.Node {
2019-08-24 01:13:26 +00:00
var node = try self.allocator.create(Node);
2019-08-24 19:00:22 +00:00
node.* = Node{ .Block = stmts };
2019-08-24 01:13:26 +00:00
return node;
}
fn mkExpr(self: *Parser, expr: *Expr) !*ast.Node {
var node = try self.allocator.create(Node);
node.* = Node{ .Expr = expr };
return node;
}
2019-08-24 19:00:22 +00:00
fn mkStmt(self: *Parser, stmt: *Stmt) !*ast.Node {
var node = try self.allocator.create(Node);
node.* = Node{ .Stmt = stmt };
return node;
}
fn mkStmtExpr(self: *Parser, expr: *Expr) !*Stmt {
var stmt = try self.allocator.create(Stmt);
stmt.* = Stmt{ .Expr = expr };
return stmt;
}
2019-08-24 01:13:26 +00:00
fn mkGrouping(self: *Parser, expr: *Expr) !*ast.Expr {
var grouping = try self.allocator.create(Expr);
grouping.* = Expr{ .Grouping = expr };
return grouping;
}
fn mkUnary(self: *Parser, op: Token, right: *Expr) !*Expr {
2019-08-24 14:07:23 +00:00
std.debug.warn("Unary\n");
2019-08-24 01:13:26 +00:00
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Unary = ast.UnaryExpr{
.op = op,
.right = right,
},
};
return expr;
}
fn mkBinary(self: *Parser, left: *Expr, op: Token, right: *Expr) !*Expr {
2019-08-24 14:07:23 +00:00
std.debug.warn("Binary\n");
2019-08-24 01:13:26 +00:00
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Binary = ast.BinaryExpr{
.left = left,
.op = op,
.right = right,
},
};
return expr;
}
fn mkBool(self: *Parser, val: bool) !*ast.Expr {
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Literal = ast.LiteralExpr{
.Bool = val,
},
};
return expr;
}
fn mkInteger(self: *Parser, val: []const u8) !*ast.Expr {
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Literal = ast.LiteralExpr{
.Integer = val,
},
};
return expr;
}
fn mkFloat(self: *Parser, val: []const u8) !*ast.Expr {
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Literal = ast.LiteralExpr{
.Float = val,
},
};
return expr;
}
fn mkString(self: *Parser, val: []const u8) !*ast.Expr {
var expr = try self.allocator.create(Expr);
expr.* = Expr{
.Literal = ast.LiteralExpr{
.String = val,
},
};
return expr;
}
pub fn parse(self: *Parser) !*ast.Node {
self.tokens = try self.allocator.alloc(Token, 0);
var root = try ast.mkRoot(self.allocator);
var token_opt: ?Token = null;
while (true) {
if (token_opt == null) {
token_opt = try self.nextToken();
} else {
token_opt = self.peek();
}
var token = token_opt.?;
if (token.ttype == .EOF) break;
var node = try self.parseTopDecl();
if (node == null) continue;
try root.Root.append(node.?);
}
if (self.hadError) {
return error.ParseError;
}
return root;
}
fn functionDecl(self: *Parser) !*ast.Node {
2019-07-01 18:55:19 +00:00
// function body
2019-07-01 20:45:13 +00:00
_ = try self.nextToken();
2019-07-01 18:55:19 +00:00
_ = try self.consumeSingle(.LeftBrace);
2019-08-23 14:57:49 +00:00
var body = ast.NodeList.init(self.allocator);
2019-07-01 18:55:19 +00:00
while (true) {
var tok = self.peek();
if (tok.ttype == .RightBrace) break;
2019-08-23 14:57:49 +00:00
// TODO statements
//var node = try self.processToken(tok);
//std.debug.warn("stmt:{}\n", node);
//try body.append(node);
tok = try self.nextToken();
2019-07-01 18:55:19 +00:00
}
_ = try self.consumeSingle(.RightBrace);
return try self.mkFnDecl(name, param_list);
2019-06-06 01:06:12 +00:00
}
2019-08-23 14:57:49 +00:00
fn processToken(self: *Parser, token: Token) anyerror!*ast.Node {
2019-07-01 18:25:07 +00:00
var node = switch (token.ttype) {
.Fn => try self.functionDecl(),
2019-08-23 14:57:49 +00:00
.Identifier => try self.functionCall(),
else => blk: {
try self.doError("TODO handle {}\n", token.ttype);
return Result.CompileError;
},
2019-07-01 18:25:07 +00:00
};
return node;
2019-06-06 01:06:12 +00:00
}
2019-08-24 01:13:26 +00:00
fn parseFnDecl(self: *@This()) !?*Node {
var param_list = ast.ParamList.init(self.allocator);
errdefer param_list.deinit();
_ = try self.consumeSingle(.Fn);
2019-08-24 14:07:23 +00:00
const name = try self.consumeSingle(.Identifier);
_ = try self.consumeSingle(.LeftParen);
2019-08-23 18:52:04 +00:00
while (self.peek().ttype != .RightParen) {
const param_name = try self.consumeSingle(.Identifier);
const param_type = try self.consumeSingle(.Identifier);
2019-08-23 18:52:04 +00:00
try param_list.append(ast.ParamDecl{
.name = param_name,
.typ = param_type,
});
}
2019-08-23 18:52:04 +00:00
_ = try self.consumeSingle(.RightParen);
2019-08-23 18:52:04 +00:00
2019-08-24 01:13:26 +00:00
// TODO return type
2019-08-24 14:07:23 +00:00
const return_type = try self.consumeSingle(.Identifier);
2019-08-24 01:13:26 +00:00
var block = try self.parseBlock();
2019-08-23 18:52:04 +00:00
std.debug.warn("!fn name: {}\n", name);
2019-08-24 14:07:23 +00:00
return try self.mkFnDecl(name, param_list, block.Block);
}
2019-08-23 18:52:04 +00:00
2019-08-24 01:13:26 +00:00
fn parseConstDecl(self: *@This()) !?*Node {
var consts = ast.ConstList.init(self.allocator);
errdefer consts.deinit();
_ = try self.consumeSingle(.Const);
_ = try self.consumeSingle(.LeftParen);
while (self.peek().ttype != .RightParen) {
const const_name = try self.consumeSingle(.Identifier);
_ = try self.consumeSingle(.Equal);
2019-08-24 19:00:22 +00:00
var expr = try self.parseExpr();
// _ = try self.nextToken();
//const const_value = try self.consumeSingle(.Identifier);
2019-08-24 19:00:22 +00:00
try consts.append(ast.SingleConst{
.name = const_name,
.expr = expr.Expr,
});
}
_ = try self.consumeSingle(.RightParen);
return self.mkConstDecl(consts);
}
2019-08-24 01:13:26 +00:00
fn parseTopDecl(self: *@This()) !?*Node {
return switch (self.peek().ttype) {
2019-08-24 01:13:26 +00:00
.Fn => try self.parseFnDecl(),
.Const => try self.parseConstDecl(),
2019-08-23 18:52:04 +00:00
2019-08-23 14:57:49 +00:00
else => |ttype| blk: {
self.doError("(basic) expected fn/const, got {}\n", ttype);
2019-08-23 14:57:49 +00:00
break :blk null;
},
};
}
2019-08-24 14:07:23 +00:00
fn parseBlock(self: *@This()) !*Node {
2019-08-24 19:00:22 +00:00
var stmts = ast.StmtList.init(self.allocator);
errdefer stmts.deinit();
2019-06-06 01:06:12 +00:00
2019-08-24 14:07:23 +00:00
_ = try self.consumeSingle(.LeftBrace);
2019-08-24 14:07:23 +00:00
while (self.peek().ttype != .RightBrace) {
2019-08-24 19:00:22 +00:00
var node = try self.parseStmt();
2019-08-24 14:07:23 +00:00
ast.printNode(node, 0);
2019-08-24 19:00:22 +00:00
try stmts.append(node.Stmt);
2019-08-24 14:07:23 +00:00
}
2019-08-24 19:00:22 +00:00
2019-08-24 01:13:26 +00:00
_ = try self.consumeSingle(.RightBrace);
2019-08-24 19:00:22 +00:00
return try self.mkBlock(stmts);
}
fn parseStmt(self: *@This()) anyerror!*Node {
var stmt = switch (self.peek().ttype) {
.Println => try self.parsePrintln(),
// TODO make newlines tokens and consume newline?
else => try self.parseStmtExpr(),
};
return try self.mkStmt(stmt);
}
fn parsePrintln(self: *@This()) !*Stmt {
_ = try self.consumeSingle(.Println);
var expr = try self.parseExpr();
return try Stmt.mkPrintln(self.allocator, expr.Expr);
}
fn parseStmtExpr(self: *@This()) !*Stmt {
var expr = (try self.parseExpr()).Expr;
return try self.mkStmtExpr(expr);
2019-08-24 01:13:26 +00:00
}
2019-08-24 01:13:26 +00:00
fn parseExpr(self: *@This()) anyerror!*Node {
var expr = try self.parseEquality();
return self.mkExpr(expr);
}
fn parseEquality(self: *@This()) !*Expr {
var expr = try self.parseComparison();
while (self.peek().ttype == .EqualEqual) {
var op = self.peek();
_ = try self.nextToken();
2019-08-24 01:13:26 +00:00
var right = try self.parseComparison();
expr = try self.mkBinary(expr, op, right);
2019-08-23 14:57:49 +00:00
}
2019-08-24 01:13:26 +00:00
return expr;
}
fn parseComparison(self: *@This()) !*Expr {
var expr = try self.parseAddition();
while (self.compareAnyOf(&[_]TokenType{
.Greater,
.GreaterEqual,
.Less,
.LessEqual,
})) {
var op = self.peek();
_ = try self.nextToken();
2019-08-24 01:13:26 +00:00
var right = try self.parseAddition();
expr = try self.mkBinary(expr, op, right);
2019-06-06 01:06:12 +00:00
}
2019-08-24 01:13:26 +00:00
return expr;
}
fn parseAddition(self: *@This()) !*Expr {
var expr = try self.parseMultiplication();
while (self.compareAnyOf(&[_]TokenType{
.Minus, .Plus,
})) {
2019-08-24 14:07:23 +00:00
var op = self.peek();
_ = try self.nextToken();
2019-08-24 01:13:26 +00:00
var right = try self.parseMultiplication();
2019-08-24 14:07:23 +00:00
expr = try self.mkBinary(expr, op, right);
2019-08-24 01:13:26 +00:00
}
return expr;
}
fn parseMultiplication(self: *@This()) !*Expr {
var expr = try self.parseUnary();
while (self.compareAnyOf(&[_]TokenType{
.Star, .Slash,
})) {
var op = self.peek();
_ = try self.nextToken();
2019-08-24 01:13:26 +00:00
var right = try self.parseUnary();
expr = try self.mkBinary(expr, op, right);
2019-08-24 01:13:26 +00:00
}
return expr;
}
fn parseUnary(self: *@This()) anyerror!*Expr {
if (self.compareAnyOf(&[_]TokenType{ .Bang, .Minus })) {
var op = self.previous();
var right = try self.parseUnary();
return try self.mkUnary(op, right);
}
2019-08-24 14:07:23 +00:00
var expr = try self.parsePrimary();
return expr;
2019-08-24 01:13:26 +00:00
}
fn parsePrimary(self: *@This()) !*Expr {
const curtype = self.peek().ttype;
const lexeme = self.peek().lexeme;
2019-08-24 14:07:23 +00:00
var expr = switch (curtype) {
.False => try self.mkBool(false),
.True => try self.mkBool(true),
2019-08-24 01:13:26 +00:00
2019-08-24 14:07:23 +00:00
.Integer => try self.mkInteger(lexeme),
.Float => try self.mkFloat(lexeme),
.String => try self.mkString(lexeme),
2019-08-24 01:13:26 +00:00
.LeftParen => blk: {
2019-08-24 14:07:23 +00:00
_ = try self.nextToken();
2019-08-24 01:13:26 +00:00
var expr = (try self.parseExpr()).Expr;
_ = try self.consume(.RightParen, "Expected ')' after expression");
break :blk try self.mkGrouping(expr);
},
else => blk: {
self.doError("expected false/true/int/float/string/leftparen, got {}", curtype);
return Result.CompileError;
},
};
2019-08-24 14:07:23 +00:00
_ = try self.nextToken();
return expr;
2019-06-05 01:11:11 +00:00
}
};