12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802 |
- import { CommonTokenStream, InputStream } from 'antlr4/index';
- import * as Expressions from './expressions/';
- import * as Commands from './commands/';
- import { Types } from './types';
- import { SyntaxError } from './SyntaxError';
/**
 * Hand-written recursive-descent parser for IVProg programs.
 *
 * The constructor tokenizes the whole input with the supplied lexer class and
 * the parser then walks the token stream through `this.pos`, a 1-based index
 * handed to `tokenStream.LT`. Methods named `check*` only inspect the current
 * token; methods named `parse*` consume the tokens they recognise.
 *
 * Expression grammar implemented by the `parseExpression*` family:
 *
 *   EOR    => EAnd ('or' EOR)?
 *   EAnd   => ENot ('and' EAnd)?
 *   ENot   => 'not'? ER
 *   ER     => E ((>=, <=, ==, >, <) E)?
 *   E      => factor ((+, -) factor)*      (left-associative)
 *   factor => term ((*, /, %) term)*       (left-associative)
 *   term   => literal | arrayAccess | funcCall | ID | '(' EOR ')'
 */
export class IVProgParser {

  // <BEGIN scope consts>
  static get BASE () {
    return 0;
  }
  static get FUNCTION () {
    return 1;
  }
  static get COMMAND () {
    return 2;
  }
  static get LOOP () {
    return 4;
  }
  // </ END scope consts>

  /**
   * @param input whatever the `InputStream` constructor accepts (the program source)
   * @param lexerClass lexer constructor; its static members supply the token
   *        type constants (RK_*, ID, EOS, ...) used throughout the parser
   */
  constructor (input, lexerClass) {
    this.lexerClass = lexerClass;
    this.lexer = new lexerClass(new InputStream(input));
    this.tokenStream = new CommonTokenStream(this.lexer);
    this.tokenStream.fill();
    this.pos = 1;
    this.variableTypes = [
      this.lexerClass.RK_INTEGER,
      this.lexerClass.RK_REAL,
      this.lexerClass.RK_BOOLEAN,
      this.lexerClass.RK_STRING
    ];
    this.functionTypes = this.variableTypes.concat(this.lexerClass.RK_VOID);
    // Nesting depth of the array literal currently being parsed.
    this.parsingArrayDimension = 0;
  }

  /**
   * Entry point: parses the whole program.
   * @returns {{global: Array, functions: Array}}
   */
  parseTree () {
    return this.parseProgram();
  }

  /**
   * @param index 1-based look-ahead index; defaults to the current position
   * @returns the token found at `index`
   */
  getToken (index = this.pos) {
    return this.tokenStream.LT(index);
  }

  /**
   * Tells whether the current token is the end-of-input token.
   *
   * The constructor already calls `tokenStream.fill()`, so a "has EOF been
   * fetched" flag on the stream cannot tell whether input remains; the type of
   * the current token is inspected instead.
   * NOTE(review): assumes the lexer class exposes `EOF` as ANTLR-generated
   * lexers do; -1 (ANTLR's Token.EOF) is used when it does not - confirm.
   */
  isEOF () {
    const eofType = this.lexerClass.EOF !== undefined ? this.lexerClass.EOF : -1;
    return this.getToken(this.pos).type === eofType;
  }

  /**
   * Parses `program { (globalDeclaration | function)* }`.
   * @returns {{global: Array, functions: Array}}
   * @throws when the program keyword or a curly brace is missing, or when
   *         tokens remain after the closing brace
   */
  parseProgram () {
    const programToken = this.getToken();
    if (this.lexerClass.RK_PROGRAM !== programToken.type) {
      throw SyntaxError.createError(this.lexer.literalNames[this.lexerClass.RK_PROGRAM], programToken);
    }
    let globalVars = [];
    let functions = [];
    this.pos++;
    this.consumeNewLines();
    this.checkOpenCurly();
    this.pos++;
    while (true) {
      this.consumeNewLines();
      const token = this.getToken();
      // A global declaration starts with 'const' or directly with a type keyword.
      if (token.type === this.lexerClass.RK_CONST || this.isVariableType(token)) {
        globalVars = globalVars.concat(this.parseGlobalVariables());
      } else if (token.type === this.lexerClass.RK_FUNCTION) {
        functions = functions.concat(this.parseFunction());
      } else {
        break;
      }
    }
    this.consumeNewLines();
    this.checkCloseCurly();
    this.pos++;
    this.consumeNewLines();
    if (!this.isEOF()) {
      throw new Error("No extra characters are allowed after 'program {...}'");
    }
    return {global: globalVars, functions: functions};
  }

  /**
   * Shared implementation of the `check*` methods: compares the current
   * token's type with `expectedType` without moving `pos`.
   *
   * @param expectedType token type constant to look for
   * @param expectedText text handed to SyntaxError.createError on a mismatch
   * @param attempt when true a mismatch yields `false` instead of throwing
   * @returns true when the current token has the expected type
   */
  checkTokenType (expectedType, expectedText, attempt = false) {
    const token = this.getToken();
    if (token.type === expectedType) {
      return true;
    }
    if (attempt) {
      return false;
    }
    throw SyntaxError.createError(expectedText, token);
  }

  /* Throws unless the current token is '{'. Does not increment pos. */
  checkOpenCurly () {
    this.checkTokenType(this.lexerClass.OPEN_CURLY, '{');
  }

  /* Throws unless the current token is '}'. Does not increment pos. */
  checkCloseCurly () {
    this.checkTokenType(this.lexerClass.CLOSE_CURLY, '}');
  }

  /* It checks if the current token at position pos is a '['.
   * As a check function it doesn't increment pos.
   *
   * @params bool:attempt, indicates that the token is optional. Defaults: false
   *
   * @returns true if the current token is '[',
   * false if attempt is true and the current token is not '['
   **/
  checkOpenBrace (attempt = false) {
    return this.checkTokenType(this.lexerClass.OPEN_BRACE, '[', attempt);
  }

  /* Same contract as checkOpenBrace, for ']'. */
  checkCloseBrace (attempt = false) {
    return this.checkTokenType(this.lexerClass.CLOSE_BRACE, ']', attempt);
  }

  /* Same contract as checkOpenBrace, for '('. */
  checkOpenParenthesis (attempt = false) {
    return this.checkTokenType(this.lexerClass.OPEN_PARENTHESIS, '(', attempt);
  }

  /* Same contract as checkOpenBrace, for ')'. */
  checkCloseParenthesis (attempt = false) {
    return this.checkTokenType(this.lexerClass.CLOSE_PARENTHESIS, ')', attempt);
  }

  /* Same contract as checkOpenBrace, for an end-of-statement (EOS) token. */
  checkEOS (attempt = false) {
    return this.checkTokenType(this.lexerClass.EOS, 'new line or \';\'', attempt);
  }

  /**
   * Parses one global declaration statement, including its terminating EOS.
   * @returns a list of declarations
   */
  parseGlobalVariables () {
    const decl = this.parseMaybeConst();
    this.checkEOS();
    this.pos++;
    return decl;
  }

  /*
   * Checks if the next token is RK_CONST. It's only available
   * at global variables declaration level
   * @returns a list of Declararion(const, type, id, initVal?)
   **/
  parseMaybeConst () {
    const constToken = this.getToken();
    if (constToken.type === this.lexerClass.RK_CONST) {
      this.pos++;
      const typeString = this.parseType();
      return this.parseDeclararion(typeString, true);
    } else if (this.isVariableType(constToken)) {
      // Go through parseType so both branches hand a Types.* value (not a raw
      // token) to parseDeclararion; parseType consumes the type token.
      const typeString = this.parseType();
      return this.parseDeclararion(typeString);
    } else {
      throw SyntaxError.createError(this.lexer.literalNames[this.lexerClass.RK_CONST] + ' or ' + this.getTypesAsString(), constToken);
    }
  }

  /*
   * Parses a declarion of the form: id ([dim]([dim])?)? (= EOR)? (, declaration)*
   * The type has already been consumed by the caller.
   * @returns a list of Declararion(const, type, id, initVal?)
   **/
  parseDeclararion (typeString, isConst = false) {
    let initial = null;
    let dim1 = null;
    let dim2 = null;
    const idString = this.parseID();
    // Check for array or vector
    // ID[int/IDi][int/IDj]
    if (this.checkOpenBrace(true)) {
      this.pos++;
      this.consumeNewLines();
      dim1 = this.parseArrayDimension();
      this.consumeNewLines();
      this.checkCloseBrace();
      this.pos++;
      if (this.checkOpenBrace(true)) {
        this.pos++;
        this.consumeNewLines();
        dim2 = this.parseArrayDimension();
        this.consumeNewLines();
        this.checkCloseBrace();
        this.pos++;
      }
    }

    const equalsToken = this.getToken();
    if (equalsToken.type === this.lexerClass.EQUAL) {
      this.pos++;
      initial = this.parseExpressionOR();
    }

    let declaration = null;
    if (dim1 !== null) {
      declaration = new Commands.ArrayDeclaration(idString,
        typeString, dim1, dim2, initial, isConst);
    } else {
      declaration = new Commands.Declaration(idString, typeString, initial, isConst);
    }

    // A comma chains another declaration sharing the same type and constness.
    const commaToken = this.getToken();
    if (commaToken.type === this.lexerClass.COMMA) {
      this.pos++;
      this.consumeNewLines();
      return [declaration].concat(this.parseDeclararion(typeString, isConst));
    }
    return [declaration];
  }

  /**
   * Skips consecutive EOS tokens whose text contains a line break. An EOS
   * token without a line break (e.g. ';') is left in place.
   */
  consumeNewLines () {
    let token = this.getToken();
    while (token.type === this.lexerClass.EOS && /[\r\n]+/.test(token.text)) {
      this.pos++;
      token = this.getToken();
    }
  }

  /**
   * @returns {boolean} true when the token's type is one of `this.variableTypes`
   */
  isVariableType (token) {
    return this.variableTypes.some(type => type === token.type);
  }

  /*
   * Reads the next token of the stream to check if it is a Integer or an ID.
   * @returns Integer | ID
   **/
  parseArrayDimension () {
    const dimToken = this.getToken();
    if (dimToken.type === this.lexerClass.INTEGER) {
      //parse as int literal
      this.pos++;
      return this.getIntLiteral(dimToken);
    } else if (dimToken.type === this.lexerClass.ID) {
      //parse as variable
      this.pos++;
      return this.parseVariable(dimToken);
    } else {
      throw SyntaxError.createError('int or ID', dimToken);
    }
  }

  /*
   * Builds an Expressions.IntLiteral from the token text.
   * It checks for binary (0b/0B) and hexadecimal (0x/0X) integers.
   **/
  getIntLiteral (token) {
    const text = token.text;
    let val = null;
    if (/^0b/i.test(text)) {
      val = parseInt(text.substring(2), 2);
    } else if (/^0x/i.test(text)) {
      val = parseInt(text.substring(2), 16);
    } else {
      val = parseInt(text, 10);
    }
    return new Expressions.IntLiteral(val);
  }

  /* Builds an Expressions.RealLiteral from the token text. */
  getRealLiteral (token) {
    return new Expressions.RealLiteral(parseFloat(token.text));
  }

  /**
   * Builds an Expressions.StringLiteral, decoding the escape sequences
   * \b \t \n \r \" \' and \\ found in the token text.
   *
   * Every occurrence is decoded in a single left-to-right pass so that an
   * escaped backslash followed by a letter (e.g. `\\n`) is not mistaken for
   * another escape. The token text is otherwise left untouched.
   */
  getStringLiteral (token) {
    const escapes = {
      'b': '\b',
      't': '\t',
      'n': '\n',
      'r': '\r',
      '"': '"',
      '\'': '\'',
      '\\': '\\'
    };
    const value = token.text.replace(/\\([btnr"'\\])/g, (match, ch) => escapes[ch]);
    return new Expressions.StringLiteral(value);
  }

  /* Builds an Expressions.BoolLiteral: true for RK_TRUE tokens, false otherwise. */
  getBoolLiteral (token) {
    const val = token.type === this.lexerClass.RK_TRUE;
    return new Expressions.BoolLiteral(val);
  }

  /**
   * Parses `{ expressionList }` into an Expressions.ArrayLiteral. Nested
   * literals are parsed recursively through parseTerm; at most two levels
   * are accepted.
   * @throws Error when nesting exceeds two levels or the outermost literal is
   *         reported invalid
   */
  parseArrayLiteral () {
    this.checkOpenCurly();
    const beginArray = this.getToken();
    if (this.parsingArrayDimension >= 2) {
      // TODO: better error message
      throw new Error(`Array dimensions exceed maximum size of 2 at line ${beginArray.line}`);
    }
    this.pos++;
    this.parsingArrayDimension++;
    this.consumeNewLines();
    const data = this.parseExpressionList();
    this.consumeNewLines();
    this.checkCloseCurly();
    this.pos++;
    this.parsingArrayDimension--;
    const literal = new Expressions.ArrayLiteral(data);
    // Validate only once the outermost literal is complete. `data` is a plain
    // array, so the validity flag has to be read from the literal object.
    // NOTE(review): assumes Expressions.ArrayLiteral exposes `isValid` - confirm.
    if (this.parsingArrayDimension === 0 && !literal.isValid) {
      // TODO: better error message
      throw new Error(`Invalid array at line ${beginArray.line}`);
    }
    return literal;
  }

  /*
   * Builds an Expressions.VariableLiteral named after the token text.
   **/
  parseVariable (token) {
    return new Expressions.VariableLiteral(token.text);
  }

  /*
   * Returns an object representing a function. It has
   * four attributes: returnType, id, formalParams and block.
   * The block object has two attributes: variables and commands.
   * Returns null when the current token is not the function keyword.
   **/
  parseFunction () {
    let formalParams = [];
    const token = this.getToken();
    if (token.type !== this.lexerClass.RK_FUNCTION) {
      return null;
    }
    this.pos++;
    // Function scope lets parseType accept 'void' or an omitted return type.
    const returnType = this.parseType(IVProgParser.FUNCTION);
    const functionID = this.parseID(IVProgParser.FUNCTION);
    this.checkOpenParenthesis();
    this.pos++;
    this.consumeNewLines();
    if (!this.checkCloseParenthesis(true)) {
      formalParams = this.parseFormalParameters(); // formal parameters
      this.consumeNewLines();
      this.checkCloseParenthesis();
      this.pos++;
    } else {
      this.pos++;
    }
    this.consumeNewLines();
    const commandsBlock = this.parseCommandBlock();
    return {returnType: returnType, id: functionID, formalParams: formalParams, block: commandsBlock};
  }

  /*
   * Parse the formal parameters of a function.
   * @returns a list of objects with the following attributes: type, id and dimensions.
   **/
  parseFormalParameters () {
    const list = [];
    while (true) {
      let dimensions = 0;
      const typeString = this.parseType();
      const idString = this.parseID();
      // Each '[]' pair after the identifier adds one dimension (two at most).
      if (this.checkOpenBrace(true)) {
        this.pos++;
        dimensions++;
        this.checkCloseBrace();
        this.pos++;
        if (this.checkOpenBrace(true)) {
          this.pos++;
          dimensions++;
          this.checkCloseBrace();
          this.pos++;
        }
      }
      list.push({type: typeString, id: idString, dimensions: dimensions});
      const commaToken = this.getToken();
      if (commaToken.type !== this.lexerClass.COMMA) {
        break;
      }
      this.pos++;
      this.consumeNewLines();
    }
    return list;
  }

  /**
   * Consumes an ID token.
   * @param scope when IVProgParser.FUNCTION, an identifier equal to
   *        lexerClass.MAIN_FUNCTION_NAME is reported as null
   * @returns the identifier text, or null for the main function name
   * @throws when the current token is not an ID
   */
  parseID (scope = IVProgParser.BASE) {
    const token = this.getToken();
    if (token.type !== this.lexerClass.ID) {
      throw SyntaxError.createError('ID', token);
    }
    this.pos++;
    if (scope === IVProgParser.FUNCTION && token.text === this.lexerClass.MAIN_FUNCTION_NAME) {
      return null;
    }
    return token.text;
  }

  /**
   * Parses a type keyword and maps it to a `Types` value.
   *
   * In function scope an ID in type position means the return type was
   * omitted: Types.VOID is returned and the ID is left unconsumed. The void
   * keyword is only accepted in function scope.
   *
   * @param scope IVProgParser.BASE (default) or IVProgParser.FUNCTION
   * @throws when the current token is not an acceptable type for the scope
   */
  parseType (scope = IVProgParser.BASE) {
    const token = this.getToken();
    if (token.type === this.lexerClass.ID && scope === IVProgParser.FUNCTION) {
      return Types.VOID;
    } else if (token.type === this.lexerClass.RK_VOID && scope === IVProgParser.FUNCTION) {
      this.pos++;
      return Types.VOID;
    } else if (this.isVariableType(token)) {
      this.pos++;
      switch (token.type) {
        case this.lexerClass.RK_INTEGER:
          return Types.INTEGER;
        // Same constant the constructor registers in variableTypes.
        case this.lexerClass.RK_BOOLEAN:
          return Types.BOOLEAN;
        case this.lexerClass.RK_REAL:
          return Types.REAL;
        case this.lexerClass.RK_STRING:
          return Types.STRING;
        default:
          break;
      }
    }

    throw SyntaxError.createError(this.getTypesAsString(scope), token);
  }

  /**
   * Parses `{ (declaration | command)* }`, consuming trailing new lines.
   *
   * @param scope IVProgParser.FUNCTION allows variable declarations;
   *        IVProgParser.LOOP allows `break`
   * @returns {{variables: Array, commands: Array}}
   */
  parseCommandBlock (scope = IVProgParser.FUNCTION) {
    let variablesDecl = [];
    const commands = [];
    this.checkOpenCurly();
    this.pos++;
    while (true) {
      // Skip line breaks before every statement, not only before the first.
      this.consumeNewLines();
      const token = this.getToken();
      if (this.isVariableType(token)) {
        if (scope !== IVProgParser.FUNCTION) {
          // TODO better error message
          throw new Error(`Cannot declare variable here (line ${token.line})`);
        }
        const typeString = this.parseType();
        variablesDecl = variablesDecl.concat(this.parseDeclararion(typeString));
        this.checkEOS();
        this.pos++;
        continue;
      }

      let cmd = null;
      if (token.type === this.lexerClass.ID) {
        cmd = this.parseIDCommand();
      } else if (token.type === this.lexerClass.RK_RETURN) {
        cmd = this.parseReturn();
      } else if (token.type === this.lexerClass.RK_WHILE) {
        cmd = this.parseWhile();
      } else if (token.type === this.lexerClass.RK_FOR) {
        cmd = this.parseFor();
      } else if (token.type === this.lexerClass.RK_BREAK) {
        if (scope !== IVProgParser.LOOP) {
          // TODO better error message
          throw new Error("Break cannot be used outside of a loop.");
        }
        cmd = this.parseBreak();
      }
      // TODO: RK_SWITCH, RK_DO and RK_IF are not parsed yet; like any other
      // unrecognised token they end the block and fail the '}' check below.

      if (cmd === null) {
        break;
      }
      commands.push(cmd);
    }
    this.consumeNewLines();
    this.checkCloseCurly();
    this.pos++;
    this.consumeNewLines();
    return {variables: variablesDecl, commands: commands};
  }

  /**
   * Parses `for (assign? EOS condition EOS assign?) block`.
   * The current token must be the for keyword.
   * @returns Commands.For(attribution, condition, increment, block)
   */
  parseFor () {
    this.pos++;
    this.checkOpenParenthesis();
    this.pos++;
    this.consumeNewLines();
    const attribution = this.parseForAssign();
    this.consumeNewLines();
    const condition = this.parseExpressionOR();
    this.checkEOS();
    this.pos++;
    const increment = this.parseForAssign(true);
    this.checkCloseParenthesis();
    this.pos++;
    this.consumeNewLines();
    const commandsBlock = this.parseCommandBlock(IVProgParser.LOOP);
    return new Commands.For(attribution, condition, increment, commandsBlock);
  }

  /**
   * Parses `while (condition) block`. The current token must be the while keyword.
   * @returns Commands.While(condition, block)
   */
  parseWhile () {
    this.pos++;
    this.checkOpenParenthesis();
    this.pos++;
    this.consumeNewLines();
    const logicalExpression = this.parseExpressionOR();
    this.consumeNewLines();
    this.checkCloseParenthesis();
    this.pos++;
    this.consumeNewLines();
    const cmdBlocks = this.parseCommandBlock(IVProgParser.LOOP);
    return new Commands.While(logicalExpression, cmdBlocks);
  }

  /* Parses `break EOS`. @returns Commands.Break */
  parseBreak () {
    this.pos++;
    this.checkEOS();
    this.pos++;
    return (new Commands.Break());
  }

  /**
   * Parses `return expression? EOS`.
   * @returns Commands.Return carrying the expression, or null when omitted
   */
  parseReturn () {
    this.pos++;
    let exp = null;
    if (!this.checkEOS(true)) {
      exp = this.parseExpressionOR();
      this.checkEOS();
    }
    this.pos++;
    return new Commands.Return(exp);
  }

  /**
   * Parses a statement that starts with an identifier: either an assignment
   * `id = expression EOS` or a call `id(arguments) EOS`.
   * @returns Commands.Assign or Expressions.FunctionCall
   */
  parseIDCommand () {
    const id = this.parseID();
    const equalOrParenthesis = this.getToken();
    if (equalOrParenthesis.type === this.lexerClass.EQUAL) {
      this.pos++;
      const exp = this.parseExpressionOR();
      this.checkEOS();
      this.pos++;
      return (new Commands.Assign(id, exp));
    } else if (equalOrParenthesis.type === this.lexerClass.OPEN_PARENTHESIS) {
      const actualParameters = this.parseActualParameters();
      this.checkEOS();
      this.pos++;
      return (new Expressions.FunctionCall(id, actualParameters));
    } else {
      throw SyntaxError.createError("= or (", equalOrParenthesis);
    }
  }

  /**
   * Parses one of the optional assignments of a `for` header.
   *
   * First clause (`isLast` false): `(id = expression)? EOS` - the separator
   * is consumed whether or not an assignment is present.
   * Last clause (`isLast` true): `(id = expression)?` - it is followed by
   * ')' rather than an EOS, and the ')' is left for the caller.
   *
   * @returns Commands.Assign, or null when the clause is empty
   */
  parseForAssign (isLast = false) {
    if (isLast) {
      if (this.checkCloseParenthesis(true)) {
        return null;
      }
    } else {
      this.consumeNewLines();
      if (this.checkEOS(true)) {
        this.pos++;
        return null;
      }
    }
    const id = this.parseID();
    const equal = this.getToken();
    if (equal.type !== this.lexerClass.EQUAL) {
      throw SyntaxError.createError('=', equal);
    }
    this.pos++;
    const exp = this.parseExpressionOR();
    if (!isLast) {
      this.checkEOS();
      this.pos++;
    }
    return new Commands.Assign(id, exp);
  }

  /* EOR => EAnd ('or' EOR)? */
  parseExpressionOR () {
    const exp1 = this.parseExpressionAND();
    const maybeOr = this.getToken();
    if (maybeOr.type === this.lexerClass.OR_OPERATOR) {
      this.pos++;
      this.consumeNewLines();
      const exp2 = this.parseExpressionOR();
      return new Expressions.InfixApp('or', exp1, exp2);
    }
    return exp1;
  }

  /* EAnd => ENot ('and' EAnd)? */
  parseExpressionAND () {
    const exp1 = this.parseExpressionNot();
    const andToken = this.getToken();
    if (andToken.type === this.lexerClass.AND_OPERATOR) {
      this.pos++;
      this.consumeNewLines();
      const exp2 = this.parseExpressionAND();
      return new Expressions.InfixApp('and', exp1, exp2);
    }
    return exp1;
  }

  /* ENot => 'not'? ER */
  parseExpressionNot () {
    const maybeNotToken = this.getToken();
    if (maybeNotToken.type === this.lexerClass.NOT_OPERATOR) {
      this.pos++;
      const exp1 = this.parseExpressionRel();
      return new Expressions.UnaryApp('not', exp1);
    }
    return this.parseExpressionRel();
  }

  /* ER => E (relationalOperator E)? */
  parseExpressionRel () {
    const exp1 = this.parseExpression();
    const relToken = this.getToken();
    if (relToken.type === this.lexerClass.RELATIONAL_OPERATOR) {
      this.pos++;
      const rel = relToken.text; // TODO: source code line/column information
      const exp2 = this.parseExpression();
      return new Expressions.InfixApp(rel, exp1, exp2);
    }
    return exp1;
  }

  /**
   * E => factor (sumOperator factor)*
   * Operands are folded left to right so that `a - b - c` is built as
   * `(a - b) - c`.
   */
  parseExpression () {
    let exp = this.parseFactor();
    let sumOpToken = this.getToken();
    while (sumOpToken.type === this.lexerClass.SUM_OP) {
      this.pos++;
      const op = sumOpToken.text; // TODO: source code line/column information
      const right = this.parseFactor();
      exp = new Expressions.InfixApp(op, exp, right);
      sumOpToken = this.getToken();
    }
    return exp;
  }

  /**
   * factor => term (multiplicativeOperator term)*
   * Folded left to right, like parseExpression.
   */
  parseFactor () {
    let exp = this.parseTerm();
    let multOpToken = this.getToken();
    while (multOpToken.type === this.lexerClass.MULTI_OP) {
      this.pos++;
      const op = multOpToken.text; // TODO: source code line/column information
      const right = this.parseTerm();
      exp = new Expressions.InfixApp(op, exp, right);
      multOpToken = this.getToken();
    }
    return exp;
  }

  /**
   * term => literal | arrayLiteral | ID-based term | '(' EOR ')'
   * @throws when the current token cannot start a term
   */
  parseTerm () {
    const token = this.getToken();
    switch (token.type) {
      case this.lexerClass.INTEGER:
        this.pos++;
        return this.getIntLiteral(token);
      case this.lexerClass.REAL:
        this.pos++;
        return this.getRealLiteral(token);
      case this.lexerClass.STRING:
        this.pos++;
        return this.getStringLiteral(token);
      case this.lexerClass.RK_TRUE:
      case this.lexerClass.RK_FALSE:
        this.pos++;
        return this.getBoolLiteral(token);
      case this.lexerClass.OPEN_CURLY:
        return this.parseArrayLiteral();
      case this.lexerClass.ID:
        return this.parseIDTerm();
      case this.lexerClass.OPEN_PARENTHESIS:
        return this.parseParenthesisExp();
      default:
        throw SyntaxError.createError('Terminal', token);
    }
  }

  /**
   * Parses a term that starts with an identifier:
   *   id[index]([index])?  -> Expressions.ArrayAccess
   *   id(arguments)        -> Expressions.FunctionCall
   *   id                   -> Expressions.VariableLiteral
   */
  parseIDTerm () {
    const id = this.parseID();
    if (this.checkOpenBrace(true)) {
      this.pos++;
      const firstIndex = this.parseExpression();
      let secondIndex = null;
      this.consumeNewLines();
      this.checkCloseBrace();
      this.pos++;
      if (this.checkOpenBrace(true)) {
        this.pos++;
        secondIndex = this.parseExpression();
        this.consumeNewLines();
        this.checkCloseBrace();
        this.pos++;
      }
      return new Expressions.ArrayAccess(id, firstIndex, secondIndex);
    }
    if (this.checkOpenParenthesis(true)) {
      // parseActualParameters consumes both parentheses itself.
      const actualParameters = this.parseActualParameters();
      return new Expressions.FunctionCall(id, actualParameters);
    }
    return new Expressions.VariableLiteral(id);
  }

  /* Parses `( EOR )` and returns the inner expression. */
  parseParenthesisExp () {
    this.checkOpenParenthesis();
    this.pos++;
    this.consumeNewLines();
    const exp = this.parseExpressionOR();
    this.consumeNewLines();
    this.checkCloseParenthesis();
    this.pos++;
    return exp;
  }

  /**
   * Parses `( expressionList? )`, consuming both parentheses.
   * @returns the list of argument expressions (empty for `()`)
   */
  parseActualParameters () {
    this.checkOpenParenthesis();
    this.pos++;
    this.consumeNewLines();
    let list = [];
    if (!this.checkCloseParenthesis(true)) {
      list = this.parseExpressionList();
      this.consumeNewLines();
      this.checkCloseParenthesis();
    }
    this.pos++;
    return list;
  }

  /**
   * Parses one or more comma-separated expressions.
   * @returns the expressions in source order
   */
  parseExpressionList () {
    const list = [];
    while (true) {
      const exp = this.parseExpressionOR();
      list.push(exp);
      const maybeToken = this.getToken();
      if (maybeToken.type !== this.lexerClass.COMMA) {
        break;
      }
      this.pos++;
      this.consumeNewLines();
    }
    return list;
  }

  /**
   * @param scope IVProgParser.FUNCTION includes the void type
   * @returns the literal names of the accepted type keywords joined by ", "
   *          (used in error messages)
   */
  getTypesAsString (scope = IVProgParser.BASE) {
    const types = scope === IVProgParser.FUNCTION ? this.functionTypes : this.variableTypes;
    return types.map(x => this.lexer.literalNames[x]).join(', ');
  }
}
|