/*
NOTE: do not allow concatenation of commands!

Operators

; - When used by PRINT and INPUT, concatenates two printables; numbers will
    have one space between them while strings will not.
, - Function argument separator
+ - Just as in JS; concatenates two strings
*/

// NOTE(review): `system`, `sys`, `con`, `serial`, `print` and `println` are
// not defined in this file; they are presumably provided by the host
// environment. The meaning of the constant 5236 is not established here.
var vmemsize = system.maxmem() - 5236;

var cmdbuf = []; // index: line number
var cmdbufMemFootPrint = 0;
var prompt = "Ok";

var lang = {};
/**
 * Builds the syntax-error message.
 * @param {*} [line] line number to mention; omitted for direct-mode errors
 * @returns {string} the message text
 */
lang.syntaxfehler = function(line) {
    if (line === undefined) return "Syntax error";
    return "Syntax error in " + line;
};

/**
 * @returns {number} bytes currently accounted to the stored program
 */
function getUsedMemSize() {
    return cmdbufMemFootPrint; // + array's dimsize * 8 + variables' sizeof literal + functions' expression length
}

/**
 * Memory footprint charged for one stored program line: the digits of the
 * line number, one separating space, and the command text.
 * @param {number} lnum line number
 * @param {string} cmd command text stored under that line number
 * @returns {number} footprint in characters
 */
function getLineMemFootPrint(lnum, cmd) {
    return ("" + lnum).length + 1 + cmd.length;
}

var reLineNum = /^[0-9]+ +[^0-9]/;
//var reFloat = /^([\-+]?[0-9]*[.][0-9]+[eE]*[\-+0-9]*[fF]*|[\-+]?[0-9]+[.eEfF][0-9+\-]*[fF]?)$/;
//var reDec = /^([\-+]?[0-9_]+)$/;
//var reHex = /^(0[Xx][0-9A-Fa-f_]+)$/;
//var reBin = /^(0[Bb][01_]+)$/;

// must match partial
// The hex and binary alternatives come first: with the decimal alternative in
// front, the leading "0" of "0x1F"/"0b101" was consumed as a decimal number and
// the prefixed forms could never match.
var reNumber = /(0[Xx][0-9A-Fa-f_]+)|(0[Bb][01_]+)|([0-9]*[.][0-9]+[eE]*[\-+0-9]*[fF]*|[0-9]+[.eEfF][0-9+\-]*[fF]?)|([0-9_]+)/g;
var reOps = /\^|\*|\/|\+|\-|[<>=]{1,2}/g;

var reNum = /[0-9]+/;
var tbasexit = false;

println("Terran BASIC 1.0 "+vmemsize+" bytes free");
println(prompt);

var basicInterpreterStatus = {};

/**
 * Variable object constructor.
 * @param {number} linenum line number of the definition (currently not stored)
 * @param {*} literal value of the variable
 * @param {*} type type tag of the variable
 */
function BasicVar(linenum, literal, type) {
    this.literal = literal;
    this.type = type;
}

/**
 * DEFUN (GW-BASIC equiv. of DEF FN) constructor.
 * @param {number} linenum line number of the definition (currently not stored)
 * @param {*} params parameters of the user function
 * @param {*} expression body expression of the user function
 */
function BasicFun(linenum, params, expression) {
    this.params = params;
    this.expression = expression;
}

/**
 * DIM (array) constructor. Call as BasicArr(linenum, dim1, dim2, ...).
 *
 * Sets `this.array` to a nested array with one nesting level per dimension
 * (innermost slots are left empty) and `this.dimsize` to the product of all
 * dimensions.
 *
 * @throws {string} an InternalError message when called with no arguments,
 *         or a syntax-error message when no dimension is given or a
 *         dimension is not a non-negative integer
 */
function BasicArr(...args) {
    if (args.length === 0) throw "InternalError: pass the line number!";
    if (args.length === 1) throw lang.syntaxfehler(args[0]);

    // Dimensions may arrive as strings; `new Array("5")` would create ["5"]
    // rather than an array of length 5, so convert before use.
    const dims = args.slice(1).map(Number);
    dims.forEach(function(d) {
        if (!Number.isInteger(d) || d < 0) throw lang.syntaxfehler(args[0]);
    });

    // create nested array as defined
    const makeNested = function(depth) {
        const arr = new Array(dims[depth]);
        if (depth < dims.length - 1) {
            for (let i = 0; i < arr.length; i++) arr[i] = makeNested(depth + 1);
        }
        return arr;
    };

    this.array = makeNested(0);
    this.dimsize = dims.reduce(function(acc, d) { return acc * d; }, 1);
}

/**
 * Abstract Syntax Tree node; created empty and filled in by the parser.
 */
function BasicAST() {
    this.lnum = 0;
    this.depth = 0;
    this.leaves = [];
    this.value = undefined;
    this.type = "null"; // literal, operator, variable, function, null

    /** @returns {string} multi-line dump of this node and all of its leaves */
    this.toString = function() {
        let sb = "";
        const marker = ("literal" === this.type) ? ">" :
                ("operator" === this.type) ? "=" : "#";
        sb += "| ".repeat(this.depth) + marker+" Line "+this.lnum+" ("+this.type+")\n";
        sb += "| ".repeat(this.depth+1) + "leaves: "+(this.leaves.length)+"\n";
        sb += "| ".repeat(this.depth+1) + "value: "+this.value+"\n";
        for (let k = 0; k < this.leaves.length; k++) {
            // a leaf's dump already ends with a newline
            sb += this.leaves[k].toString();
        }
        sb += "| ".repeat(this.depth+1) + "----------------\n";
        return sb;
    };
}

basicInterpreterStatus.gosubStack = [];
basicInterpreterStatus.variables = {};
basicInterpreterStatus.defuns = {};
basicInterpreterStatus.builtin = {};
/** PRINT builtin: prints its arguments joined by tabs, or an empty line. */
basicInterpreterStatus.builtin.print = function(...args) {
    if (args.length === 0)
        println();
    else
        println(args.join("\t"));
};
Object.freeze(basicInterpreterStatus.builtin);

var basicFunctions = {};

/** @returns {boolean} true for the char codes of '0'..'9' and '.' */
basicFunctions._isNumber = function(code) {
    return (code >= 0x30 && code <= 0x39) || code === 0x2E;
};
/** @returns {boolean} true for the char codes of '(' and '[' */
basicFunctions._isParenOpen = function(code) {
    return (code === 0x28 || code === 0x5B);
};
/** @returns {boolean} true for the char codes of ')' and ']' */
basicFunctions._isParenClose = function(code) {
    return (code === 0x29 || code === 0x5D);
};
/** @returns {boolean} true for any opening or closing paren/bracket code */
basicFunctions._isParen = function(code) {
    return basicFunctions._isParenOpen(code) || basicFunctions._isParenClose(code);
};
/** @returns {boolean} true for the char code of ',' */
basicFunctions._isSeparator = function(code) {
    return code === 0x2C;
};
basicFunctions._operatorPrecedence = {
    // function call in itself has highest precedence
    "^":13,
    "POSITIVE":12,"NEGATIVE":12,"NOT":12,
    "*":11,"/":11,
    "MOD":10,
    "+":9,"-":9,
    "<<":8,">>":8,
    "==":7,"<>":7,"><":7,"!=":7,"<":7,">":7,"<=":7,"=<":7,">=":7,"=>":7,
    "BAND":6,
    "BXOR":5,
    "BOR":4,
    "AND":3,
    "OR":2,
    "=":1
};
/** @returns {boolean} whether `word` is a key of the precedence table */
basicFunctions._isOperatorWord = function(word) {
    return (basicFunctions._operatorPrecedence[word] !== undefined); // force the return type to be a boolean
};
basicFunctions._keywords = {

};

/**
 * Recursively turns a token list into a BasicAST.
 *
 * DO NOT PERFORM SEMANTIC ANALYSIS HERE: at this point you can't (and
 * shouldn't) distinguish whether or not defuns/variables are previously
 * declared.
 *
 * a line has one of these forms:
 *   VARIABLE = LITERAL
 *   VARIABLE = FUNCTION ARGUMENTS
 *   FUNCTION
 *   FUNCTION ARGUMENTS --arguments may contain another function call
 *   "FOR" VARIABLE "=" ARGUMENT "TO" ARGUMENT
 *   "FOR" VARIABLE "=" ARGUMENT "TO" ARGUMENT "STEP" ARGUMENT
 *   "IF" EXPRESSION "THEN" EXPRESSION
 *   "IF" EXPRESSION "THEN" EXPRESSION "ELSE" EXPRESSION
 *   "IF" EXPRESSION "GOTO" ARGUMENT
 *   "IF" EXPRESSION "GOTO" ARGUMENT "ELSE" EXPRESSION
 *   "WHILE" EXPRESSION
 * additionally, sub-line also has one of these:
 *   LITERAL (leaf node)
 *   VARIABLE (leaf node)
 *   {VARIABLE, LITERAL} COMPARISON_OP {VARIABLE, LITERAL}
 *
 * Only literal leaves and (nested) function calls are implemented so far;
 * an IF statement throws "TODO".
 *
 * @param {number} lnum line number being parsed
 * @param {string[]} tokens token texts
 * @param {string[]} states token kinds, parallel to `tokens`
 * @param {number} recDepth recursion depth (0 for the whole line)
 * @returns {BasicAST} root node for the given tokens
 * @throws {string} on internal inconsistencies, unmatched parentheses, or IF
 */
basicFunctions._parseTokens = function(lnum, tokens, states, recDepth) {
    println("Parser Ln "+lnum+", Rec "+recDepth+", Tkn: "+tokens.join("/"));

    if (tokens.length !== states.length) throw "InternalError: size of tokens and states does not match (line: "+lnum+", recursion depth: "+recDepth+")";
    if (tokens.length === 0) throw "InternalError: empty tokens (line: "+lnum+", recursion depth: "+recDepth+")";

    const treeHead = new BasicAST();
    treeHead.depth = recDepth;
    treeHead.lnum = lnum;

    // TODO ability to parse arbitrary parentheses
    // test string: print((minus(plus(3,2),times(8,7))))
    //                   ^                             ^ these extra parens break your parser

    // IF statement
    if ("IF" === tokens[0].toUpperCase()) {
        throw "TODO";
    }
    // LEAF: is this a literal?
    else if (recDepth > 0 && ("quote" === states[0] || "number" === states[0])) {
        treeHead.value = tokens[0];
        treeHead.type = "literal";
    }
    // is this a function?
    else {
        // find and mark position of separators and parentheses
        // properly deal with the nested function calls
        const currentFunction = (states[0] === "paren") ? undefined : tokens[0];
        let parenDepth = 0;
        let parenStart = 0;
        let parenEnd = -1;
        let separators = [];

        treeHead.value = currentFunction;
        treeHead.type = (currentFunction === undefined) ? "null" : "function";

        for (let k = 0; k < tokens.length; k++) {
            if (tokens[k] === "(") {
                parenDepth += 1;
                if (parenDepth === 1) parenStart = k;
            }
            else if (tokens[k] === ")") {
                if (parenDepth === 1) parenEnd = k;
                parenDepth -= 1;
            }

            // only separators of the outermost call split its arguments
            if (parenDepth === 1 && states[k] === "sep") {
                separators.push(k);
            }
        }

        if (parenDepth !== 0) throw "Unmatched brackets";

        const leaves = [];

        // if there is no paren: everything after the head word is one argument
        if (parenStart === 0 && parenEnd === -1 && tokens.length > 1) {
            const subtkn = tokens.slice(1, tokens.length);
            const substa = states.slice(1, tokens.length);

            leaves.push(basicFunctions._parseTokens(lnum, subtkn, substa, recDepth + 1));
        }
        else if (parenEnd > parenStart) {
            separators = [parenStart].concat(separators, [parenEnd]);
            // recursively parse comma-separated arguments

            // print ( plus ( 3 , 2 ) , times ( 8 , 7 ) )
            //   separators = [1,8,15]
            // plus ( 3 , 2 )  /  times ( 8 , 7 )
            //   separators = [1,5] ; [1,5]
            // 3 / 2 / 8 / 7

            for (let k = 1; k < separators.length; k++) {
                const subtkn = tokens.slice(separators[k - 1] + 1, separators[k]);
                const substa = states.slice(separators[k - 1] + 1, separators[k]);

                leaves.push(basicFunctions._parseTokens(lnum, subtkn, substa, recDepth + 1));
            }
        }
        treeHead.leaves = leaves;
    }

    return treeHead;
};

/**
 * Splits a command into tokens with a character-driven state machine.
 *
 * States: literal, escape, quote, quote_end, paren, sep, limbo.
 *
 * @param {number} lnum line number (used for debug output only)
 * @param {string} cmd command text without its line number
 * @returns {{tokens: string[], states: string[]}} token texts and the state
 *          each token was emitted in (parallel arrays)
 * @throws {string} if the machine reaches an unknown state
 */
basicFunctions._tokenise = function(lnum, cmd) {
    const _debugprintStateTransition = false;
    const tokens = [];
    const states = [];
    let sb = "";
    // Start between tokens rather than inside a literal: starting in
    // "literal" emitted an empty leading token whenever the command began
    // with a space, a quote or a parenthesis.
    let mode = "limbo";

    // emits the token collected so far, tagged with the current state
    const flush = function() {
        tokens.push(sb);
        states.push(mode);
    };

    if (_debugprintStateTransition) println("Ln "+lnum+" cmd "+cmd);

    for (let k = 0; k < cmd.length; k++) {
        const ch = cmd[k];
        const charCode = cmd.charCodeAt(k);

        if (_debugprintStateTransition) print("Char: "+ch+"("+charCode+"), state: "+mode);

        if ("literal" === mode) {
            if (0x22 === charCode) { // "
                flush(); sb = ""; mode = "quote";
            }
            /*else if (charCode == 0x5C) { // reverse solidus
                tokens.push(sb); sb = "";
                mode = "escape";
            }*/
            else if (basicFunctions._isParen(charCode)) {
                flush(); sb = "" + ch; mode = "paren";
            }
            else if (" " === ch) {
                flush(); sb = ""; mode = "limbo";
            }
            else if (basicFunctions._isSeparator(charCode)) {
                flush(); sb = "" + ch; mode = "sep";
            }
            else {
                sb += ch;
            }
        }
        else if ("escape" === mode) {
            // Currently unreachable: the only transition into "escape" is
            // commented out above. Unrecognised escape characters are dropped.
            if (0x5C === charCode) // reverse solidus
                sb += String.fromCharCode(0x5C);
            else if ("n" === ch)
                sb += String.fromCharCode(0x0A);
            else if ("t" === ch)
                sb += String.fromCharCode(0x09);
            else if (0x22 === charCode) // "
                sb += String.fromCharCode(0x22);
            else if (0x27 === charCode)
                sb += String.fromCharCode(0x27);
            else if ("e" === ch)
                sb += String.fromCharCode(0x1B);
            else if ("a" === ch)
                sb += String.fromCharCode(0x07);
            else if ("b" === ch)
                sb += String.fromCharCode(0x08);
            mode = "quote"; // ESCAPE is only legal when used inside of quote
        }
        else if ("quote" === mode) {
            if (0x22 === charCode) {
                flush(); sb = ""; mode = "quote_end";
            }
            else {
                sb += ch;
            }
        }
        else if ("quote_end" === mode) {
            // the quoted token was already emitted; just pick the next state
            if (" " === ch) {
                sb = ""; mode = "limbo";
            }
            else if (0x22 === charCode) {
                sb = "" + ch; mode = "quote";
            }
            else if (basicFunctions._isParen(charCode)) {
                sb = "" + ch; mode = "paren";
            }
            else if (basicFunctions._isSeparator(charCode)) {
                sb = "" + ch; mode = "sep";
            }
            else {
                sb = "" + ch; mode = "literal";
            }
        }
        else if ("limbo" === mode) {
            if (ch === " ") {
                /* do nothing */
            }
            else if (0x22 === charCode) {
                sb = ""; mode = "quote";
            }
            else if (basicFunctions._isParen(charCode)) {
                // keep the character: the parser looks for "(" / ")" tokens
                sb = "" + ch; mode = "paren";
            }
            else if (basicFunctions._isSeparator(charCode)) {
                sb = "" + ch; mode = "sep";
            }
            else {
                sb = "" + ch; mode = "literal";
            }
        }
        else if ("paren" === mode || "sep" === mode) {
            // a paren or separator is always a one-character token, so it is
            // emitted as soon as the next character arrives
            flush();
            if (ch === " ") {
                sb = ""; mode = "limbo";
            }
            else if (0x22 === charCode) {
                sb = ""; mode = "quote";
            }
            else if (basicFunctions._isParen(charCode)) {
                sb = "" + ch; mode = "paren";
            }
            else if (basicFunctions._isSeparator(charCode)) {
                sb = "" + ch; mode = "sep";
            }
            else {
                sb = "" + ch; mode = "literal";
            }
        }
        else {
            throw "Unknown parser state: " + mode;
        }

        if (_debugprintStateTransition) println("->"+mode);
    }

    // emit whatever is still being collected at end of input
    if (sb.length > 0) flush();

    return { tokens: tokens, states: states };
};

/**
 * Returns every match of a global regex in `text`.
 * @param {RegExp} re regex carrying the `g` flag (shared, hence stateful)
 * @param {string} text text to scan
 * @returns {Array} match objects in order of appearance
 */
basicFunctions._collectMatches = function(re, text) {
    const found = [];
    re.lastIndex = 0; // never resume from where a previous scan stopped
    let match = re.exec(text);
    while (match !== null) {
        found.push(match);
        match = re.exec(text);
    }
    return found;
};

/**
 * Distinguishes numbers and operators from literals, splitting compound
 * tokens such as "3+2" into their parts. Quote and paren tokens are left
 * untouched; a line whose first token is REM is not elaborated.
 *
 * NOTE(review): a token counts as "number" as soon as reNumber matches any
 * part of it and reOps matches none, so e.g. "x1" is tagged "number" too.
 *
 * @param {string[]} tokensIn token texts from the tokeniser
 * @param {string[]} statesIn token kinds, parallel to `tokensIn`
 * @returns {{tokens: string[], states: string[]}} elaborated copies
 * @throws {string} InternalError if a compound token contains a character
 *         that starts neither a number nor an operator
 */
basicFunctions._elaborate = function(tokensIn, statesIn) {
    const tokens = tokensIn.slice();
    const states = statesIn.slice();

    let k = 0;
    while (k < states.length) { // using while loop because array size will change during the execution
        serial.println("k="+k+" of "+states.length);

        if ("quote" === states[k] || "paren" === states[k]) {
            k += 1;
            continue;
        }

        if ("REM" === tokens[0].toUpperCase()) break;

        // if the tokeniser worked as intended, anything left would be one of those:
        //  compound of numbers and operators
        //  a number
        //  an operator

        println("token="+tokens[k]+", type="+typeof tokens[k]);

        const token = tokens[k];
        const numberMatches = basicFunctions._collectMatches(reNumber, token);
        const opMatches = basicFunctions._collectMatches(reOps, token);

        if (opMatches.length === 0 && numberMatches.length === 0) {
            /* do nothing */
        }
        else if (opMatches.length === 0) {
            states[k] = "number";
        }
        else if (numberMatches.length === 0) {
            states[k] = "operators";
        }
        else {
            // this is where the fun begins
            const reMatchNumbers = numberMatches.map(function(it) { return it[0]; });
            const reMatchOps = opMatches.map(function(it) { return it[0]; });
            const midTokens = [];
            const midStates = [];
            let tokenReadCursor = 0;
            let numMatchCursor = 0;
            let opsMatchCursor = 0;

            serial.println("token="+token);
            serial.println("state="+states[k]);
            serial.println("reMatchNumbers="+reMatchNumbers.join(","));
            serial.println("reMatchOps="+reMatchOps.join(","));

            while (tokenReadCursor < token.length) {
                // An operator character can sit inside a number (the sign of
                // an exponent, as in "3e-2"); skip such matches so the two
                // cursors stay in step.
                while (opsMatchCursor < opMatches.length && opMatches[opsMatchCursor].index < tokenReadCursor) {
                    opsMatchCursor += 1;
                }

                serial.println("c="+tokenReadCursor+",n="+numMatchCursor+",o="+opsMatchCursor);

                if (opsMatchCursor < opMatches.length && opMatches[opsMatchCursor].index === tokenReadCursor) {
                    midTokens.push(reMatchOps[opsMatchCursor]);
                    midStates.push("operators");
                    tokenReadCursor += reMatchOps[opsMatchCursor].length;
                    opsMatchCursor += 1;
                }
                else if (numMatchCursor < numberMatches.length && numberMatches[numMatchCursor].index === tokenReadCursor) {
                    midTokens.push(reMatchNumbers[numMatchCursor]);
                    // same tag as the single-number case; the parser tests for "number"
                    midStates.push("number");
                    tokenReadCursor += reMatchNumbers[numMatchCursor].length;
                    numMatchCursor += 1;
                }
                else {
                    throw "InternalError: c="+tokenReadCursor+",n="+numMatchCursor+",o="+opsMatchCursor+"\n"+
                            "reMatchNumbers="+reMatchNumbers.join(",")+"\n"+
                            "reMatchOps="+reMatchOps.join(",");
                }
            }

            // replace the compound token by its parts and step over them
            tokens.splice(k, 1, ...midTokens);
            states.splice(k, 1, ...midStates);

            k += (midTokens.length - 1);
        }

        k += 1;
    }

    return { tokens: tokens, states: states };
};

/**
 * Tokenises, elaborates and parses one program line, printing the
 * intermediate results. Execution of the parsed line is not implemented yet.
 *
 * @param {number} lnum line number of the command
 * @param {string} cmd command text
 * @returns {number} line number for the next command; currently always
 *          (lnum + 1), since GOTO/GOSUB are not implemented here
 */
basicFunctions._interpretLine = function(lnum, cmd) {
    // TOKENISE
    const tokenised = basicFunctions._tokenise(lnum, cmd);
    if (tokenised.tokens.length !== tokenised.states.length) throw "InternalError: size of tokens and states does not match (line: "+lnum+")";
    // END TOKENISE

    // ELABORATION : distinguish numbers and operators from literals
    const elaborated = basicFunctions._elaborate(tokenised.tokens, tokenised.states);
    const tokens = elaborated.tokens;
    const states = elaborated.states;
    // END ELABORATION

    // PARSING (SYNTAX ANALYSIS)
    const syntaxTree = basicFunctions._parseTokens(lnum, tokens, states, 0);
    println("k bye");
    serial.println(syntaxTree.toString());
    // END PARSING

    println(tokens.join("~"));
    println(states.join(" "));

    return lnum + 1;
}; // end INTERPRETLINE

/**
 * Prints one program line with its number padded to three columns.
 * Usable directly as an Array.prototype.forEach callback.
 * @param {string} v command text
 * @param {number} i line number
 * @param {Array} arr unused
 */
basicFunctions._basicList = function(v, i, arr) {
    if (i < 10) print(" ");
    if (i < 100) print(" ");
    print(i);
    print(" ");
    println(v);
};

/**
 * LIST function.
 *   LIST          lists the whole program
 *   LIST n        lists line n, if it exists
 *   LIST a b      lists lines a..b ("." as b means the last line)
 * @param {string[]} args command words; args[0] is the command name
 */
basicFunctions.list = function(args) {
    if (args.length === 1) {
        cmdbuf.forEach(basicFunctions._basicList);
    }
    else if (args.length === 2) {
        const lnum = Number(args[1]);
        if (cmdbuf[lnum] !== undefined)
            basicFunctions._basicList(cmdbuf[lnum], lnum, undefined);
    }
    else {
        const requestedLast = (args[2] === ".") ? cmdbuf.length - 1 : (args[2] | 0);
        // nothing is stored beyond the end of the buffer, so don't walk there
        const lastIndex = Math.min(requestedLast, cmdbuf.length - 1);
        // a non-numeric start becomes NaN and lists nothing
        for (let i = Number(args[1]); i <= lastIndex; i++) {
            const cmd = cmdbuf[i];
            if (cmd !== undefined) {
                basicFunctions._basicList(cmd, i, cmdbuf);
            }
        }
    }
};

/** SYSTEM function: makes the read loop at the end of the file terminate. */
basicFunctions.system = function(args) {
    tbasexit = true;
};

/** NEW function: discards the stored program and its memory accounting. */
basicFunctions.new = function(args) {
    cmdbuf = [];
    cmdbufMemFootPrint = 0;
};

/**
 * RENUM function: renumbers the program to 10, 20, 30, ... and rewrites
 * lines that start with GOTO/GOSUB to point at the new numbers. A GOTO/GOSUB
 * without a number, or one whose target line does not exist, is left as is.
 */
basicFunctions.renum = function(args) {
    const newcmdbuf = [];
    const linenumRelation = []; // index: old line number, value: new line number
    let cnt = 10;
    for (let k = 0; k < cmdbuf.length; k++) {
        if (cmdbuf[k] !== undefined) {
            newcmdbuf[cnt] = cmdbuf[k];
            linenumRelation[k] = cnt;
            cnt += 10;
        }
    }

    // deal with goto/gosub line numbers
    for (let k = 0; k < newcmdbuf.length; k++) {
        const cmd = newcmdbuf[k];
        if (cmd === undefined) continue;

        const lowered = cmd.toLowerCase();
        let keyword;
        if (lowered.startsWith("goto ")) keyword = "goto ";
        else if (lowered.startsWith("gosub ")) keyword = "gosub ";
        else continue;

        const target = cmd.match(reNum);
        if (target === null) continue;

        const mapped = linenumRelation[target[0] | 0];
        if (mapped !== undefined) newcmdbuf[k] = keyword + mapped;
    }

    cmdbuf = newcmdbuf.slice(); // make shallow copy

    // recalculate memory footprint
    cmdbufMemFootPrint = 0;
    cmdbuf.forEach(function(v, i, arr) {
        cmdbufMemFootPrint += getLineMemFootPrint(i, v);
    });
};

/** FRE function: prints vmemsize minus the memory used by the program. */
basicFunctions.fre = function(args) {
    println(vmemsize - getUsedMemSize());
};

/**
 * RUN function: interprets the stored lines in ascending order, starting at
 * line 0, until the end of the buffer is reached or con.hitterminate()
 * returns a truthy value.
 */
basicFunctions.run = function(args) {
    let linenumber = 0;
    let oldnum = 0;
    while (linenumber < cmdbuf.length) {
        if (cmdbuf[linenumber] !== undefined) {
            oldnum = linenumber;
            linenumber = basicFunctions._interpretLine(linenumber, cmdbuf[linenumber]);
        }
        else {
            linenumber += 1;
        }

        if (con.hitterminate()) {
            println("Break in "+oldnum);
            break;
        }
    }
};
Object.freeze(basicFunctions);

// Read loop: a line starting with a number is stored in the program buffer;
// anything else is looked up as a direct command in basicFunctions.
while (!tbasexit) {
    var line = sys.read();
    line = line.trim();

    if (reLineNum.test(line)) {
        var i = line.indexOf(" ");
        // parse the number so that e.g. "010" and "10" address the same line
        var lnum = parseInt(line.slice(0, i), 10);
        var newcmd = line.slice(i + 1, line.length);

        // overwriting a line must release what the old text was charged
        if (cmdbuf[lnum] !== undefined)
            cmdbufMemFootPrint -= getLineMemFootPrint(lnum, cmdbuf[lnum]);

        cmdbuf[lnum] = newcmd;
        cmdbufMemFootPrint += getLineMemFootPrint(lnum, newcmd);
    }
    else if (line.length > 0) {
        try {
            var cmd = line.split(/ +/);
            var cmdName = cmd[0].toLowerCase();
            // Only own, non-internal functions are commands; this keeps
            // "_interpretLine" or inherited names such as "constructor"
            // from being invoked by user input.
            var isCommand = cmdName.charAt(0) !== "_" &&
                    Object.prototype.hasOwnProperty.call(basicFunctions, cmdName) &&
                    typeof basicFunctions[cmdName] === "function";
            if (!isCommand) throw "Unknown command: " + cmd[0];
            basicFunctions[cmdName](cmd);
        }
        catch (e) {
            println(e);
            println(lang.syntaxfehler());
        }
        println(prompt);
    }
}

/*
State diagram (Graphviz) for the tokeniser. NOTE(review): it contains states
(LINENUMBER, NUMBER, OPERATOR) that the tokeniser above does not implement.

digraph G {
  start -> LITERAL
  start -> LINENUMBER [label="reDec"]

  LINENUMBER -> LINENUMBER [label="numbers"]
  LINENUMBER -> limbo [label="space"]
  LINENUMBER -> LITERAL [label="otherwise"]

  LITERAL -> limbo [label="space"]
  LITERAL -> OPERATOR [label="reOps"]
  LITERAL -> ESCAPE [label="\\"]
  LITERAL -> QUOTE [label="\""]
  LITERAL -> PAREN [label="()[]"]
  LITERAL -> SEP [label=","]
  LITERAL -> LITERAL [label="otherwise"]

  limbo -> NUMBER [label="numbers"]
  limbo -> OPERATOR [label="reOps"]
  limbo -> QUOTE [label="\""]
  limbo -> LITERAL [label="otherwise"]
  limbo -> PAREN [label="()[]"]
  limbo -> SEP [label=","]
  limbo -> limbo [label="space"]

  ESCAPE -> LITERAL

  QUOTE -> QUOTE_END [label="\""]
  QUOTE -> QUOTE [label="otherwise"]

  QUOTE_END -> limbo [label="space"]
  QUOTE_END -> NUMBER [label="numbers"]
  QUOTE_END -> OPERATOR [label="reOps"]
  QUOTE_END -> PAREN [label="()[]"]
  QUOTE_END -> SEP [label=","]
  QUOTE_END -> LITERAL [label="otherwise"]

  OPERATOR -> NUMBER [label="numbers"]
  OPERATOR -> limbo [label="space"]
  OPERATOR -> OPERATOR [label="reOps"]
  OPERATOR -> PAREN [label="()[]"]
  OPERATOR -> SEP [label=","]
  OPERATOR -> LITERAL [label="otherwise"]

  NUMBER -> NUMBER [label="numbers"]
  NUMBER -> OPERATOR [label="reOps"]
  NUMBER -> QUOTE [label="\""]
  NUMBER -> limbo [label="space"]
  NUMBER -> PAREN [label="()[]"]
  NUMBER -> SEP [label=","]
  NUMBER -> LITERAL [label="otherwise"]

  PAREN -> PUSH_AND_PAREN [label="()[]"]
  PAREN -> NUMBER [label="numbers"]
  PAREN -> OPERATOR [label="reOps"]
  PAREN -> QUOTE [label="\""]
  PAREN -> limbo [label="space"]
  PAREN -> SEP [label=","]
  PAREN -> LITERAL [label="otherwise"]

  SEP -> PAREN [label="()[]"]
  SEP -> NUMBER [label="numbers"]
  SEP -> OPERATOR [label="reOps"]
  SEP -> QUOTE [label="\""]
  SEP -> limbo [label="space"]
  SEP -> PUSH_AND_SEP [label=","]
  SEP -> LITERAL [label="otherwise"]

  LITERAL -> end [label="\\n"]
  NUMBER -> end [label="\\n"]
  QUOTE_END -> end [label="\\n"]
  OPERATOR -> end [label="\\n"]
  PAREN -> end [label="\\n"]

  start [shape=Mdiamond];
  end [shape=Msquare];

  concentrate=true;
}
*/