2020-02-25 12:26:21 +01:00
|
|
|
|
2020-02-25 17:55:17 +01:00
|
|
|
import * as acorn from "acorn"
|
|
|
|
|
2020-02-25 12:26:21 +01:00
|
|
|
import {
|
|
|
|
Syntax,
|
|
|
|
Token,
|
|
|
|
FuncDecl,
|
|
|
|
Identifier,
|
|
|
|
SyntaxKind,
|
|
|
|
TokenStream,
|
|
|
|
RetStmt,
|
|
|
|
VarDecl,
|
|
|
|
Stmt,
|
|
|
|
Patt,
|
|
|
|
Expr,
|
|
|
|
BindPatt,
|
|
|
|
Param,
|
|
|
|
RefExpr,
|
|
|
|
TypeRef,
|
|
|
|
TypeDecl,
|
|
|
|
ConstExpr,
|
2020-02-25 17:55:17 +01:00
|
|
|
QualName,
|
|
|
|
ForeignDecl,
|
|
|
|
CallExpr,
|
2020-02-25 12:26:21 +01:00
|
|
|
} from "./ast"
|
|
|
|
|
|
|
|
/**
 * Returns a short human-readable description of a token kind, for use in
 * parse error messages (e.g. "an identifier", "';'").
 *
 * @param kind The token kind to describe.
 * @returns The description, including quotes for punctuation and keywords.
 * @throws Error when no description is registered for `kind`.
 */
function describeKind(kind: SyntaxKind): string {
  switch (kind) {
    case SyntaxKind.Identifier:
      return "an identifier"
    case SyntaxKind.Operator:
      return "an operator"
    case SyntaxKind.StringLiteral:
      return "a string"
    case SyntaxKind.IntegerLiteral:
      return "an integer"
    case SyntaxKind.FunctionKeyword:
      return "'fn'"
    case SyntaxKind.ForeignKeyword:
      return "'foreign'"
    case SyntaxKind.LetKeyword:
      return "'let'"
    case SyntaxKind.Semi:
      return "';'"
    case SyntaxKind.Colon:
      return "':'"
    case SyntaxKind.Dot:
      return "'.'"
    case SyntaxKind.Comma:
      return "','"
    // The parser recognises these two kinds, so they can show up as the
    // "actual" token of a ParseError and must be describable.
    case SyntaxKind.EqSign:
      return "'='"
    case SyntaxKind.RArrow:
      return "'->'"
    case SyntaxKind.Braced:
      return "'{' .. '}'"
    case SyntaxKind.Bracketed:
      return "'[' .. ']'"
    case SyntaxKind.Parenthesized:
      return "'(' .. ')'"
    case SyntaxKind.EOS:
      return "'}', ')', ']' or end-of-file"
    default:
      throw new Error(`failed to describe ${SyntaxKind[kind]}`)
  }
}
|
|
|
|
|
|
|
|
/**
 * Joins a list of alternatives into an English enumeration:
 * `[]` -> `""`, `["a"]` -> `"a"`, `["a", "b"]` -> `"a or b"`,
 * `["a", "b", "c"]` -> `"a, b or c"`.
 *
 * @param elements The alternatives, already rendered as text.
 * @returns The enumeration, or an empty string when there are no elements.
 */
function enumerate(elements: string[]): string {
  if (elements.length === 0) {
    // Avoid producing " or undefined" for an empty list.
    return '';
  }
  if (elements.length === 1) {
    return elements[0];
  }
  const leading = elements.slice(0, elements.length - 1).join(', ');
  return leading + ' or ' + elements[elements.length - 1];
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
 * Error thrown when the parser meets a token it did not expect.
 *
 * The message has the shape
 * `<path>:<line>:<column>: expected <alternatives> but got <actual>`,
 * where the location is read from `actual.span`.
 */
export class ParseError extends Error {
  /**
   * @param actual The token that was found.
   * @param expected The token kinds that would have been accepted instead.
   */
  constructor(public actual: Token, public expected: SyntaxKind[]) {
    super(`${actual.span.file.path}:${actual.span.start.line}:${actual.span.start.column}: expected ${enumerate(expected.map(e => describeKind(e)))} but got ${describeKind(actual.kind)}`)
    // Keep `instanceof ParseError` working when the code is compiled to ES5,
    // where calling `super()` on a built-in resets the prototype chain.
    Object.setPrototypeOf(this, new.target.prototype);
    // Report as "ParseError: ..." rather than the generic "Error: ...".
    this.name = 'ParseError';
  }
}
|
|
|
|
|
|
|
|
/**
 * Hand-written parser that builds AST nodes from a `TokenStream`.
 *
 * Each `parse*` method consumes tokens from the stream it is handed and
 * throws a `ParseError` when it meets a token it cannot accept. Throughout
 * the class `peek()` / `peek(1)` is used for the next token and `peek(2)` for
 * the token after it.
 */
export class Parser {

  constructor() {

  }

  /**
   * Parses a qualified name: zero or more `<identifier> '.'` pairs followed by
   * a final identifier.
   *
   * @param tokens The stream to read from.
   * @returns A `QualName` built from the final identifier and the leading path
   *   segments. The last two constructor arguments are `null` and a
   *   `[first, last]` node pair; presumably the parent node and the source
   *   origin. Confirm against `./ast`.
   * @throws ParseError when a path segment or the final name is not an identifier.
   */
  parseQualName(tokens: TokenStream) {

    const path: Identifier[] = [];

    while (true) {
      // A '.' right after the next token means the next token is a path segment.
      const lookahead = tokens.peek(2);
      if (lookahead.kind !== SyntaxKind.Dot) {
        break;
      }
      const segment = tokens.get();
      if (segment.kind !== SyntaxKind.Identifier) {
        throw new ParseError(segment, [SyntaxKind.Identifier]);
      }
      path.push(segment as Identifier)
      // Consume the '.' that was seen in the lookahead.
      tokens.get();
    }

    const name = tokens.get();
    if (name.kind !== SyntaxKind.Identifier) {
      throw new ParseError(name, [SyntaxKind.Identifier]);
    }

    const startNode = path.length > 0 ? path[0] : name;
    const endNode = name;
    return new QualName(name, path, null, [startNode, endNode]);
  }

  /**
   * Parses a pattern. Only a single identifier is accepted, which becomes a
   * `BindPatt`.
   *
   * @throws ParseError when the next token is not an identifier.
   */
  parsePattern(tokens: TokenStream): Patt {
    const t0 = tokens.peek(1);
    if (t0.kind === SyntaxKind.Identifier) {
      tokens.get();
      return new BindPatt(t0, null, t0)
    } else {
      throw new ParseError(t0, [SyntaxKind.Identifier])
    }
  }

  /**
   * Parses a type declaration. Only a (qualified) name is accepted, which
   * becomes a `TypeRef` with an empty second argument.
   *
   * @throws ParseError when the next token is not an identifier.
   */
  parseTypeDecl(tokens: TokenStream): TypeDecl {
    const t0 = tokens.peek();
    if (t0.kind === SyntaxKind.Identifier) {
      const name = this.parseQualName(tokens)
      return new TypeRef(name, [], null, name.origNode)
    } else {
      throw new ParseError(t0, [SyntaxKind.Identifier]);
    }
  }

  /**
   * Parses a primary expression: a string literal (`ConstExpr`) or a
   * qualified name (`RefExpr`).
   *
   * @throws ParseError when the next token is neither a string literal nor an identifier.
   */
  parsePrimExpr(tokens: TokenStream): Expr {
    const t0 = tokens.peek();
    if (t0.kind === SyntaxKind.StringLiteral) {
      tokens.get();
      return new ConstExpr(t0.value, null, t0);
    } else if (t0.kind === SyntaxKind.Identifier) {
      const name = this.parseQualName(tokens);
      return new RefExpr(name, null, name.origNode);
    } else {
      throw new ParseError(t0, [SyntaxKind.StringLiteral, SyntaxKind.Identifier]);
    }
  }

  /**
   * Parses an expression. Currently this only delegates to `parsePrimExpr`.
   */
  parseExpr(tokens: TokenStream) {
    return this.parsePrimExpr(tokens)
  }

  /**
   * Parses a parameter of the form `<pattern> [':' <type>] ['=' <expr>]`.
   *
   * @returns A `Param` holding the pattern, the type declaration (or `null`)
   *   and the default value (or `null`).
   */
  parseParam(tokens: TokenStream) {

    let defaultValue = null;
    let typeDecl = null;

    const pattern = this.parsePattern(tokens)

    const t0 = tokens.peek(1);
    if (t0.kind === SyntaxKind.Colon) {
      tokens.get();
      typeDecl = this.parseTypeDecl(tokens);
      // A default value may still follow the type annotation.
      const t1 = tokens.peek(1);
      if (t1.kind === SyntaxKind.EqSign) {
        tokens.get();
        defaultValue = this.parseExpr(tokens);
      }
    } else if (t0.kind === SyntaxKind.EqSign) {
      tokens.get();
      defaultValue = this.parseExpr(tokens);
    }

    // NOTE(review): parseFuncDecl constructs Param with five arguments while
    // this call passes three; confirm the trailing arguments are optional.
    return new Param(pattern, typeDecl, defaultValue)

  }

  /**
   * Parses a variable declaration. Not implemented yet: the leading 'let' is
   * consumed and an error is thrown, rather than silently returning
   * `undefined` from a method that promises a `VarDecl`.
   *
   * @throws Error always, until the declaration grammar is implemented.
   */
  parseVarDecl(tokens: TokenStream): VarDecl {

    // Assuming first token is 'let'
    tokens.get();

    // TODO parse the rest of the declaration
    throw new Error(`parseVarDecl is not implemented yet`);

  }

  /**
   * Parses a return statement: the 'return' token, optionally followed by an
   * expression when the stream is not at `EOS`.
   *
   * @returns A `RetStmt` whose last argument is the `[first, last]` node pair;
   *   for a bare `return` both entries are the 'return' token itself.
   */
  parseRetStmt(tokens: TokenStream): RetStmt {

    // Assuming first token is 'return'
    const t0 = tokens.get();

    let expr: Expr | null = null;

    const t1 = tokens.peek();
    if (t1.kind !== SyntaxKind.EOS) {
      expr = this.parseExpr(tokens)
    }

    // A bare `return` has no expression to ask for its end node.
    const endNode = expr !== null ? expr.getEndNode() : t0;
    return new RetStmt(expr, null, [t0, endNode]);
  }

  /**
   * Parses a list of statements. Not implemented yet: always returns an empty
   * list and does not read from `tokens`.
   */
  parseStmts(tokens: TokenStream, origNode: Syntax | null): Stmt[] {
    // TODO
    return []
  }

  /**
   * Checks that a stream has been fully consumed.
   *
   * @throws ParseError when the next token is not `EOS`.
   */
  protected assertEmpty(tokens: TokenStream) {
    const t0 = tokens.peek(1);
    if (t0.kind !== SyntaxKind.EOS) {
      throw new ParseError(t0, [SyntaxKind.EOS]);
    }
  }

  /**
   * Parses a function declaration:
   *
   *     ['foreign' <string>] 'fn' <signature> [<RArrow> <type>] [<braced body>]
   *
   * where `<signature>` is one of
   *  - `<operator> <param>` (prefix operator),
   *  - `<param> <operator> <param> { <operator> <param> }` (infix / n-ary
   *    operator, every operator must have the same text), or
   *  - `<qualified name> [ '(' <param> { ',' <param> } ')' ]`.
   *
   * The target language defaults to "Bolt"; `foreign "<lang>"` overrides it.
   * A "JS" body is handed to acorn, a "Bolt" body to `parseStmts`.
   *
   * @param tokens The stream to read from.
   * @param origNode Passed through unchanged as the last `FuncDecl` argument.
   * @throws ParseError on an unexpected token.
   * @throws Error when n-ary operators differ or the target language is unknown.
   */
  parseFuncDecl(tokens: TokenStream, origNode: Syntax | null) {

    let target = "Bolt";

    // Only peek here: for a plain function the first token is already 'fn'
    // and must be left for the check below.
    const k0 = tokens.peek();
    if (k0.kind !== SyntaxKind.Identifier) {
      throw new ParseError(k0, [SyntaxKind.ForeignKeyword, SyntaxKind.FunctionKeyword])
    }
    if (k0.text === 'foreign') {
      tokens.get();
      const l1 = tokens.get();
      if (l1.kind !== SyntaxKind.StringLiteral) {
        throw new ParseError(l1, [SyntaxKind.StringLiteral])
      }
      target = l1.value;
    }
    const k1 = tokens.get();
    if (k1.text !== 'fn') {
      throw new ParseError(k1, [SyntaxKind.FunctionKeyword])
    }

    let name: QualName;
    let returnType = null;
    let body = null;
    let params: Param[] = [];

    // Parse parameters

    const t0 = tokens.peek(1);
    const t1 = tokens.peek(2);

    const isParamLike = (token: Token) =>
      token.kind === SyntaxKind.Identifier || token.kind === SyntaxKind.Parenthesized;

    // Parses one operand of an operator signature: either a bare identifier
    // or a parenthesized full parameter.
    const parseParamLike = (stream: TokenStream) => {
      const first = stream.peek(1);
      if (first.kind === SyntaxKind.Identifier) {
        stream.get();
        return new Param(new BindPatt(first, null, first), null, null, null, first)
      } else if (first.kind === SyntaxKind.Parenthesized) {
        stream.get();
        const innerTokens = first.toTokenStream();
        const param = this.parseParam(innerTokens)
        // Nothing may follow the parameter inside the parentheses.
        this.assertEmpty(innerTokens);
        return param
      } else {
        throw new ParseError(first, [SyntaxKind.Identifier, SyntaxKind.Parenthesized])
      }
    }

    if (t0.kind === SyntaxKind.Operator) {

      // Prefix operator: <op> <param>
      name = new QualName(t0, [], null, t0);
      tokens.get();
      params.push(parseParamLike(tokens))

    } else if (isParamLike(t0) && t1.kind === SyntaxKind.Operator) {

      // Infix / n-ary operator: <param> <op> <param> { <op> <param> }
      params.push(parseParamLike(tokens));
      name = new QualName(t1, [], null, t1);
      while (true) {
        const op = tokens.peek();
        if (op.kind !== SyntaxKind.Operator) {
          break;
        }
        if (op.text !== t1.text) {
          throw new Error(`Operators have to match when defining or declaring an n-ary operator.`);
        }
        tokens.get();
        params.push(parseParamLike(tokens))
      }

    } else if (t0.kind === SyntaxKind.Identifier) {

      // Named function: <qualified name> [ ( <params> ) ]
      name = this.parseQualName(tokens)
      // Only consume the next token when it really is a parameter list, so
      // that a return arrow or body directly after the name is not lost.
      const paramList = tokens.peek();
      if (paramList.kind === SyntaxKind.Parenthesized) {
        tokens.get();
        const innerTokens = paramList.toTokenStream();
        while (true) {
          const next = innerTokens.peek();
          if (next.kind === SyntaxKind.EOS) {
            break;
          }
          params.push(this.parseParam(innerTokens))
          const separator = innerTokens.get();
          if (separator.kind === SyntaxKind.Comma) {
            continue;
          } else if (separator.kind === SyntaxKind.EOS) {
            break;
          } else {
            throw new ParseError(separator, [SyntaxKind.Comma, SyntaxKind.EOS])
          }
        }
      }

    } else {

      throw new ParseError(t0, [SyntaxKind.Identifier, SyntaxKind.Operator, SyntaxKind.Parenthesized])

    }

    // Parse return type

    const t2 = tokens.peek();
    if (t2.kind === SyntaxKind.RArrow) {
      tokens.get();
      returnType = this.parseTypeDecl(tokens);
    }

    // Parse function body

    const t3 = tokens.peek();
    if (t3.kind === SyntaxKind.Braced) {
      tokens.get();
      switch (target) {
        case "Bolt":
          // NOTE(review): this passes the outer stream, not the tokens inside
          // the braces; parseStmts is still a stub so it makes no difference
          // yet, but it probably should receive the body's own token stream.
          body = this.parseStmts(tokens, t3);
          break;
        case "JS":
          body = acorn.parse(t3.text).body;
          break;
        default:
          throw new Error(`Unrecognised language: ${target}`);
      }
    }

    return new FuncDecl(target, name, params, returnType, body, null, origNode)

  }

  /**
   * Parses a call expression: a primary expression followed by a
   * parenthesized, comma-separated argument list (a trailing comma is
   * accepted).
   *
   * @throws ParseError when the callee is not followed by parentheses or the
   *   arguments are not separated by commas.
   */
  parseCallExpr(tokens: TokenStream) {

    const operator = this.parsePrimExpr(tokens)
    const args: Expr[] = []

    const t2 = tokens.get();
    if (t2.kind !== SyntaxKind.Parenthesized) {
      throw new ParseError(t2, [SyntaxKind.Parenthesized])
    }

    const innerTokens = t2.toTokenStream();

    while (true) {
      const t3 = innerTokens.peek();
      if (t3.kind === SyntaxKind.EOS) {
        break;
      }
      args.push(this.parseExpr(innerTokens))
      const t4 = innerTokens.get();
      if (t4.kind === SyntaxKind.EOS) {
        break
      } else if (t4.kind !== SyntaxKind.Comma){
        throw new ParseError(t4, [SyntaxKind.Comma])
      }
    }

    return new CallExpr(operator, args, null)

  }

}
|
|
|
|
|