Files
jack-compiler/internal/compilation-engine/compilation-engine.go
T

649 lines
18 KiB
Go

package engine
import (
"errors"
"slices"
"strings"
"github.com/hazemKrimi/jack-compiler/internal/tokenizer"
)
func WriteToken(output *strings.Builder, token tokenizer.Token, index *int) error {
if _, err := output.WriteString("<" + token.XML + "> " + token.Value + " </" + token.XML + ">\n"); err != nil {
return err
}
(*index)++
return nil
}
func compileClassVarDec(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || !slices.Contains([]string{"static", "field"}, tokens[*index].Value) {
return nil
}
output.WriteString("<classVarDec>\n")
WriteToken(output, tokens[*index], index)
if !slices.Contains([]tokenizer.TokenType{tokenizer.KEYWORD, tokenizer.IDENTIFIER}, tokens[*index].Type) && !slices.Contains([]string{"int", "char", "boolean"}, tokens[*index].Value) {
return errors.New("Invalid variable type name!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
for tokens[*index].Type == tokenizer.SYMBOL && tokens[*index].Value == "," {
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ";" {
return errors.New("Missing semicolon!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</classVarDec>\n")
return compileClassVarDec(output, tokens, index)
}
func compileParameterList(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if !slices.Contains([]tokenizer.TokenType{tokenizer.KEYWORD, tokenizer.IDENTIFIER}, tokens[*index].Type) || !slices.Contains([]string{"int", "char", "boolean"}, tokens[*index].Value) {
return nil
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type == tokenizer.SYMBOL && tokens[*index].Value == "," {
WriteToken(output, tokens[*index], index)
return compileParameterList(output, tokens, index)
}
return nil
}
func compileVariableDeclaration(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "var" {
return nil
}
output.WriteString("<varDec>\n")
WriteToken(output, tokens[*index], index)
if !slices.Contains([]tokenizer.TokenType{tokenizer.KEYWORD, tokenizer.IDENTIFIER}, tokens[*index].Type) && !slices.Contains([]string{"int", "char", "boolean"}, tokens[*index].Value) {
return errors.New("Invalid variable type name!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
for tokens[*index].Type == tokenizer.SYMBOL && tokens[*index].Value == "," {
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ";" {
return errors.New("Missing semicolon!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</varDec>\n")
return compileVariableDeclaration(output, tokens, index)
}
func compileSubroutineCall(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Value == "." {
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid subroutine name!")
}
WriteToken(output, tokens[*index], index)
}
if tokens[*index].Value != "(" {
return errors.New("Missing subroutine call opening parenthese!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<expressionList>\n")
if err := compileExpressionList(output, tokens, index); err != nil {
return err
}
output.WriteString("</expressionList>\n")
if tokens[*index].Value != ")" {
return errors.New("Missing subroutine call closing parenthese!")
}
WriteToken(output, tokens[*index], index)
return nil
}
func compileTerm(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
output.WriteString("<term>\n")
if tokens[*index].Type == tokenizer.SYMBOL && slices.Contains([]string{"-", "~"}, tokens[*index].Value) {
WriteToken(output, tokens[*index], index)
if err := compileTerm(output, tokens, index); err != nil {
return err
}
output.WriteString("</term>\n")
return nil
}
if slices.Contains([]tokenizer.TokenType{tokenizer.INT_CONST, tokenizer.STR_CONST}, tokens[*index].Type) || slices.Contains([]string{"true", "false", "null", "this"}, tokens[*index].Value) {
WriteToken(output, tokens[*index], index)
output.WriteString("</term>\n")
return nil
}
if tokens[*index].Type == tokenizer.SYMBOL && tokens[*index].Value == "(" {
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ")" {
return errors.New("Invalid term!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</term>\n")
return nil
}
if tokens[*index].Type == tokenizer.IDENTIFIER {
WriteToken(output, tokens[*index], index)
if tokens[*index].Value == "[" {
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "]" {
return errors.New("Invalid term!")
}
WriteToken(output, tokens[*index], index)
} else if slices.Contains([]string{"(", "."}, tokens[*index].Value) {
if err := compileSubroutineCall(output, tokens, index); err != nil {
return err
}
}
output.WriteString("</term>\n")
}
return nil
}
func compileExpression(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
output.WriteString("<expression>\n")
if err := compileTerm(output, tokens, index); err != nil {
return err
}
if slices.Contains([]string{"+", "-", "*", "/", "&amp;", "|", "&lt;", "&gt;", "="}, tokens[*index].Value) {
WriteToken(output, tokens[*index], index)
if err := compileTerm(output, tokens, index); err != nil {
return err
}
}
output.WriteString("</expression>\n")
return nil
}
func compileExpressionList(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if slices.Contains([]tokenizer.TokenType{tokenizer.IDENTIFIER, tokenizer.INT_CONST, tokenizer.STR_CONST}, tokens[*index].Type) || slices.Contains([]string{"true", "false", "null", "this", "~", "-", "("}, tokens[*index].Value) {
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type == tokenizer.SYMBOL && tokens[*index].Value == "," {
WriteToken(output, tokens[*index], index)
return compileExpressionList(output, tokens, index)
}
}
return nil
}
func compileLetStatement(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "let" {
return errors.New("Invalid let statement!")
}
output.WriteString("<letStatement>\n")
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Value == "[" {
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "]" {
return errors.New("Invalid expression!")
}
WriteToken(output, tokens[*index], index)
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "=" {
return errors.New("Missing assignment!")
}
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ";" {
return errors.New("Missing semicolon!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</letStatement>\n")
return nil
}
func compileIfStatement(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "if" {
return errors.New("Invalid if statement!")
}
output.WriteString("<ifStatement>\n")
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "(" {
return errors.New("Missing if statement opening parenthese!")
}
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ")" {
return errors.New("Missing if statement closing parenthese!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "{" {
return errors.New("Missing if statement opening curly brace!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<statements>\n")
if err := compileStatements(output, tokens, index); err != nil {
return err
}
output.WriteString("</statements>\n")
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "}" {
return errors.New("Missing if statement closing curly brace!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type == tokenizer.KEYWORD && tokens[*index].Value == "else" {
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "{" {
return errors.New("Missing if statement opening curly brace!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<statements>\n")
if err := compileStatements(output, tokens, index); err != nil {
return err
}
output.WriteString("</statements>\n")
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "}" {
return errors.New("Missing if statement closing curly brace!")
}
WriteToken(output, tokens[*index], index)
}
output.WriteString("</ifStatement>\n")
return nil
}
func compileWhileStatement(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "while" {
return errors.New("Invalid while statement!")
}
output.WriteString("<whileStatement>\n")
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "(" {
return errors.New("Missing while statement opening parenthese!")
}
WriteToken(output, tokens[*index], index)
if err := compileExpression(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ")" {
return errors.New("Missing while statement closing parenthese!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "{" {
return errors.New("Missing while statement opening curly brace!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<statements>\n")
if err := compileStatements(output, tokens, index); err != nil {
return err
}
output.WriteString("</statements>\n")
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "}" {
return errors.New("Missing while statement closing curly brace!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</whileStatement>\n")
return nil
}
func compileDoStatement(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "do" {
return errors.New("Invalid do statement!")
}
output.WriteString("<doStatement>\n")
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid variable name!")
}
WriteToken(output, tokens[*index], index)
if err := compileSubroutineCall(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ";" {
return errors.New("Missing semicolon!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</doStatement>\n")
return nil
}
func compileReturnStatement(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || tokens[*index].Value != "return" {
return errors.New("Invalid return statement!")
}
output.WriteString("<returnStatement>\n")
WriteToken(output, tokens[*index], index)
if slices.Contains([]tokenizer.TokenType{tokenizer.KEYWORD, tokenizer.IDENTIFIER, tokenizer.INT_CONST, tokenizer.STR_CONST}, tokens[*index].Type) {
if err := compileExpression(output, tokens, index); err != nil {
return err
}
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ";" {
return errors.New("Missing semicolon!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</returnStatement>\n")
return nil
}
func compileStatements(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD {
return nil
}
switch tokens[*index].Value {
case "let":
if err := compileLetStatement(output, tokens, index); err != nil {
return err
}
case "if":
if err := compileIfStatement(output, tokens, index); err != nil {
return err
}
case "while":
if err := compileWhileStatement(output, tokens, index); err != nil {
return err
}
case "do":
if err := compileDoStatement(output, tokens, index); err != nil {
return err
}
case "return":
if err := compileReturnStatement(output, tokens, index); err != nil {
return err
}
default:
return errors.New("Invalid statement!")
}
return compileStatements(output, tokens, index)
}
func compileSubroutineBody(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type == tokenizer.KEYWORD && tokens[*index].Value == "var" {
if err := compileVariableDeclaration(output, tokens, index); err != nil {
return err
}
}
output.WriteString("<statements>\n")
if err := compileStatements(output, tokens, index); err != nil {
return err
}
output.WriteString("</statements>\n")
return nil
}
func compileSubroutineDeclaration(output *strings.Builder, tokens []tokenizer.Token, index *int) error {
if tokens[*index].Type != tokenizer.KEYWORD || !slices.Contains([]string{"constructor", "method", "function"}, tokens[*index].Value) {
return nil
}
output.WriteString("<subroutineDec>\n")
WriteToken(output, tokens[*index], index)
if !slices.Contains([]tokenizer.TokenType{tokenizer.KEYWORD, tokenizer.IDENTIFIER}, tokens[*index].Type) && !slices.Contains([]string{"void", "int", "char", "boolean"}, tokens[*index].Value) {
return errors.New("Invalid subroutine return type!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid subroutine name!")
}
WriteToken(output, tokens[*index], index)
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "(" {
return errors.New("Missing subroutine opening parenthese!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<parameterList>\n")
if err := compileParameterList(output, tokens, index); err != nil {
return err
}
output.WriteString("</parameterList>\n")
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != ")" {
return errors.New("Missing subroutine closing parenthese!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("<subroutineBody>\n")
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "{" {
return errors.New("Missing subroutine opening curly brace!")
}
WriteToken(output, tokens[*index], index)
if err := compileSubroutineBody(output, tokens, index); err != nil {
return err
}
if tokens[*index].Type != tokenizer.SYMBOL || tokens[*index].Value != "}" {
return errors.New("Missing subroutine closing curly brace!")
}
WriteToken(output, tokens[*index], index)
output.WriteString("</subroutineBody>\n")
output.WriteString("</subroutineDec>\n")
return compileSubroutineDeclaration(output, tokens, index)
}
func compileClass(output *strings.Builder, tokens []tokenizer.Token) error {
index := 0
output.WriteString("<class>\n")
if tokens[index].Type != tokenizer.KEYWORD || tokens[index].Value != "class" {
return errors.New("Jack file must contain one class!")
}
WriteToken(output, tokens[index], &index)
if tokens[index].Type != tokenizer.IDENTIFIER {
return errors.New("Invalid class name!")
}
WriteToken(output, tokens[index], &index)
if tokens[index].Type != tokenizer.SYMBOL || tokens[index].Value != "{" {
return errors.New("Missing class opening curly brace!")
}
WriteToken(output, tokens[index], &index)
if err := compileClassVarDec(output, tokens, &index); err != nil {
return err
}
if err := compileSubroutineDeclaration(output, tokens, &index); err != nil {
return err
}
if tokens[index].Type != tokenizer.SYMBOL || tokens[index].Value != "}" {
return errors.New("Missing class closing curly brace!")
}
WriteToken(output, tokens[index], &index)
output.WriteString("</class>\n")
return nil
}
func Compile(tokens []tokenizer.Token) (string, error) {
var output strings.Builder
if err := compileClass(&output, tokens); err != nil {
return "", err
}
return output.String(), nil
}