Commit 2ded42e9 by Torkel Ödegaard

improved parser code

parent 35ae9e33
...@@ -130,22 +130,12 @@ define([ ...@@ -130,22 +130,12 @@ define([
i2 >= 48 && i2 <= 57; // 0-9 i2 >= 48 && i2 <= 57; // 0-9
} }
var Token = {
Identifier: "Identifier",
NumericLiteral: "NumericLiteral",
StringLiteral: "StringLiteral",
Punctuator: "Punctuator"
};
function Lexer(expression) { function Lexer(expression) {
this.input = expression; this.input = expression;
this.char = 1; this.char = 1;
this.from = 1; this.from = 1;
} }
Lexer.Token = Token;
Lexer.prototype = { Lexer.prototype = {
peek: function (i) { peek: function (i) {
...@@ -344,7 +334,7 @@ define([ ...@@ -344,7 +334,7 @@ define([
switch (id) { switch (id) {
default: default:
type = Token.Identifier; type = "identifier";
} }
return { return {
...@@ -415,7 +405,7 @@ define([ ...@@ -415,7 +405,7 @@ define([
if (value.length <= 2) { // 0x if (value.length <= 2) { // 0x
return { return {
type: Token.NumericLiteral, type: 'number',
value: value, value: value,
isMalformed: true isMalformed: true
}; };
...@@ -429,7 +419,7 @@ define([ ...@@ -429,7 +419,7 @@ define([
} }
return { return {
type: Token.NumericLiteral, type: 'number',
value: value, value: value,
base: 16, base: 16,
isMalformed: false isMalformed: false
...@@ -465,7 +455,7 @@ define([ ...@@ -465,7 +455,7 @@ define([
} }
return { return {
type: Token.NumericLiteral, type: 'number',
value: value, value: value,
base: 8, base: 8,
isMalformed: false isMalformed: false
...@@ -545,7 +535,7 @@ define([ ...@@ -545,7 +535,7 @@ define([
} }
return { return {
type: Token.NumericLiteral, type: 'number',
value: value, value: value,
base: 10, base: 10,
isMalformed: !isFinite(value) isMalformed: !isFinite(value)
...@@ -563,7 +553,7 @@ define([ ...@@ -563,7 +553,7 @@ define([
case "{": case "{":
case "}": case "}":
return { return {
type: Token.Punctuator, type: ch1,
value: ch1 value: ch1
}; };
} }
...@@ -594,93 +584,22 @@ define([ ...@@ -594,93 +584,22 @@ define([
var value = ""; var value = "";
var startLine = this.line; var startLine = this.line;
var startChar = this.char; var startChar = this.char;
var allowNewLine = false;
this.skip(); this.skip();
while (this.peek() !== quote) { while (this.peek() !== quote) {
while (this.peek() === "") { // End Of Line
// If an EOL is not preceded by a backslash, show a warning
// and proceed like it was a legit multi-line string where
// author simply forgot to escape the newline symbol.
//
// Another approach is to implicitly close a string on EOL
// but it generates too many false positives.
if (!allowNewLine) {
this.trigger("warning", {
code: "W112",
line: this.line,
character: this.char
});
} else {
allowNewLine = false;
// Otherwise show a warning if multistr option was not set.
// For JSON, show warning no matter what.
this.triggerAsync("warning", {
code: "W043",
line: this.line,
character: this.char
}, checks, function () { return !state.option.multistr; });
this.triggerAsync("warning", {
code: "W042",
line: this.line,
character: this.char
}, checks, function () { return state.jsonMode && state.option.multistr; });
}
// If we get an EOF inside of an unclosed string, show an
// error and implicitly close it at the EOF point.
if (!this.nextLine()) {
this.trigger("error", {
code: "E029",
line: startLine,
character: startChar
});
return {
type: Token.StringLiteral,
value: value,
isUnclosed: true,
quote: quote
};
}
}
allowNewLine = false;
var char = this.peek(); var char = this.peek();
var jump = 1; // A length of a jump, after we're done var jump = 1; // A length of a jump, after we're done
// parsing this character. // parsing this character.
if (char < " ") {
// Warn about a control character in a string.
this.trigger("warning", {
code: "W113",
line: this.line,
character: this.char,
data: [ "<non-printable>" ]
});
}
// Special treatment for some escaped characters. // Special treatment for some escaped characters.
if (char === "\\") { if (char === "\\") {
this.skip(); this.skip();
char = this.peek(); char = this.peek();
switch (char) { switch (char) {
case "'": case "'":
this.triggerAsync("warning", {
code: "W114",
line: this.line,
character: this.char,
data: [ "\\'" ]
}, checks, function () {return state.jsonMode; });
break; break;
case "b": case "b":
char = "\b"; char = "\b";
...@@ -699,41 +618,16 @@ define([ ...@@ -699,41 +618,16 @@ define([
break; break;
case "0": case "0":
char = "\0"; char = "\0";
// Octal literals fail in strict mode.
// Check if the number is between 00 and 07.
var n = parseInt(this.peek(1), 10);
this.triggerAsync("warning", {
code: "W115",
line: this.line,
character: this.char
}, checks,
function () { return n >= 0 && n <= 7 && state.directive["use strict"]; });
break; break;
case "u": case "u":
char = String.fromCharCode(parseInt(this.input.substr(1, 4), 16)); char = String.fromCharCode(parseInt(this.input.substr(1, 4), 16));
jump = 5; jump = 5;
break; break;
case "v": case "v":
this.triggerAsync("warning", {
code: "W114",
line: this.line,
character: this.char,
data: [ "\\v" ]
}, checks, function () { return state.jsonMode; });
char = "\v"; char = "\v";
break; break;
case "x": case "x":
var x = parseInt(this.input.substr(1, 2), 16); var x = parseInt(this.input.substr(1, 2), 16);
this.triggerAsync("warning", {
code: "W114",
line: this.line,
character: this.char,
data: [ "\\x-" ]
}, checks, function () { return state.jsonMode; });
char = String.fromCharCode(x); char = String.fromCharCode(x);
jump = 3; jump = 3;
break; break;
...@@ -742,7 +636,6 @@ define([ ...@@ -742,7 +636,6 @@ define([
case "/": case "/":
break; break;
case "": case "":
allowNewLine = true;
char = ""; char = "";
break; break;
case "!": case "!":
...@@ -753,11 +646,6 @@ define([ ...@@ -753,11 +646,6 @@ define([
/*falls through */ /*falls through */
default: default:
// Weird escaping. // Weird escaping.
this.trigger("warning", {
code: "W044",
line: this.line,
character: this.char
});
} }
} }
...@@ -767,7 +655,7 @@ define([ ...@@ -767,7 +655,7 @@ define([
this.skip(); this.skip();
return { return {
type: Token.StringLiteral, type: 'string',
value: value, value: value,
isUnclosed: false, isUnclosed: false,
quote: quote quote: quote
......
...@@ -20,186 +20,147 @@ define([ ...@@ -20,186 +20,147 @@ define([
this.lexer = new Lexer(expression); this.lexer = new Lexer(expression);
this.state = "start"; this.state = "start";
this.error = null; this.error = null;
this.tokens = this.lexer.tokenize();
this.index = 0;
} }
Parser.Nodes = NodeTypes; Parser.Nodes = NodeTypes;
Parser.prototype = { Parser.prototype = {
getAst: function () { getAst: function () {
return this.parse('start'); return this.start();
}, },
isUnexpectedToken: function (expected, value) { start: function () {
if (this.token === null) { return this.functionCall() || this.metricExpression();
this.error = "Expected token: " + expected + " instead found end of string"; },
return true;
}
if (this.token.type === expected) { metricExpression: function() {
return false; if (!this.match('identifier')) {
return null;
} }
if (value && this.token.value === value) { var node = {
return false; type: 'metric',
segments: [{
type: 'segment',
value: this.tokens[this.index].value
}]
} }
this.error = "Expected token " + expected + this.index++;
' instead found token ' + this.token.type +
' ("' + this.token.value + '")' +
" at position: " + this.lexer.char;
return true; if (this.match('.')) {
this.index++;
var rest = this.metricExpression();
node.segments = node.segments.concat(rest.segments)
}
return node;
}, },
parse: function (state, allowParams) { matchToken: function(type, index) {
var node = { }; var token = this.tokens[this.index + index];
return (token === undefined && type === '') ||
token && token.type === type;
},
while(true) { match: function(token1, token2) {
this.token = this.lexer.next(); return this.matchToken(token1, 0) &&
(!token2 || this.matchToken(token2, 1))
},
switch(state) { functionCall: function() {
case "start": if (!this.match('identifier', '(')) {
if (allowParams) {
if (this.token === null) {
return null; return null;
} }
if (this.token.type === Lexer.Token.NumericLiteral) { var node = {
return { type: 'function',
type: NodeTypes.NumericLiteral, name: this.tokens[this.index].value,
value: parseInt(this.token.value)
}; };
}
if (this.token.type === Lexer.Token.StringLiteral) { this.index += 2;
return {
type: NodeTypes.StringLiteral,
value: this.token.value
};
}
}
if (this.isUnexpectedToken(Lexer.Token.Identifier)) { node.params = this.functionParameters();
return;
}
state = "identifier"; if (!this.match(')')) {
this.prevToken = this.token; this.error = 'missing closing paranthesis';
break;
case "identifier":
if (this.token == null || (allowParams && this.token.value === ',')) {
return {
type: NodeTypes.MetricExpression,
segments: [{
type: NodeTypes.MetricExpression,
value: this.prevToken.value
}]
};
}
if (this.isUnexpectedToken(Lexer.Token.Punctuator)) {
return null; return null;
} }
if (this.token.value === '.') { this.index++;
state = "metricNode";
node.type = NodeTypes.MetricExpression;
node.segments = [{
type: NodeTypes.MetricNode,
value: this.prevToken.value
}];
continue;
}
if (this.token.value === '(') {
node.type = NodeTypes.FunctionCall;
node.name = this.prevToken.value;
node.params = this.parseFunc();
return node;
}
if (this.token.value === ')') {
return node; return node;
} },
break;
case 'metricEnd': functionParameters: function () {
if (this.token === null) { if (this.match(')') || this.match('')) {
return node; return [];
} }
if (this.isUnexpectedToken(Lexer.Token.Punctuator)) { var param =
return null; this.functionCall() ||
} this.metricExpression() ||
this.numericLiteral() ||
this.stringLiteral();
if (this.token.value === '.') { if (!this.match(',')) {
state = 'metricNode'; return [param];
} }
if (allowParams && (this.token.value === ',' || this.token.value === ')')) { this.index++;
return node; return [param].concat(this.functionParameters());
} },
break; numericLiteral: function () {
case 'metricNode': if (!this.match('number')) {
if (this.isUnexpectedToken(Lexer.Token.Identifier)) {
return null; return null;
} }
node.segments.push({ this.index++;
type: NodeTypes.MetricNode,
value: this.token.value
});
state = 'metricEnd'; return {
break; type: 'number',
default: value: this.tokens[this.index-1].value
this.error = 'unknown token: ' + this.token.type; };
}
}
}, },
parseFunc: function() { stringLiteral: function () {
var arguments = []; if (!this.match('string')) {
var arg;
while(true) {
arg = this.parse('start', true);
if (arg === null) {
this.error = "expected function arguments";
return null; return null;
} }
arguments.push(arg); this.index++;
if (this.token === null) { return {
this.error = "expected closing function at position: " + this.lexer.char; type: 'string',
return null; value: this.tokens[this.index-1].value
} };
},
if (this.token.value === ')') { isUnexpectedToken: function (expected, value) {
return arguments; if (this.token === null) {
this.error = "Expected token: " + expected + " instead found end of string";
return true;
} }
if (this.token.type === Lexer.Token.NumericLiteral || if (this.token.type === expected) {
this.token.type === Lexer.Token.StringLiteral) { return false;
this.token = this.lexer.next();
} }
if (this.isUnexpectedToken(Lexer.Token.Punctuator, ',')) { if (value && this.token.value === value) {
return null; return false;
} }
if (this.token.value === ')') { this.error = "Expected token " + expected +
return arguments; ' instead found token ' + this.token.type +
} ' ("' + this.token.value + '")' +
} " at position: " + this.lexer.char;
} return true;
},
}; };
return Parser; return Parser;
......
...@@ -9,22 +9,22 @@ define([ ...@@ -9,22 +9,22 @@ define([
var tokens = lexer.tokenize(); var tokens = lexer.tokenize();
expect(tokens[0].value).to.be('metric'); expect(tokens[0].value).to.be('metric');
expect(tokens[1].value).to.be('.'); expect(tokens[1].value).to.be('.');
expect(tokens[2].type).to.be(Lexer.Token.Identifier); expect(tokens[2].type).to.be('identifier');
expect(tokens[3].type).to.be(Lexer.Token.Punctuator); expect(tokens[4].type).to.be('identifier');
}); });
it('should tokenize functions and args', function() { it('should tokenize functions and args', function() {
var lexer = new Lexer("sum(metric.test, 12, 'test')"); var lexer = new Lexer("sum(metric.test, 12, 'test')");
var tokens = lexer.tokenize(); var tokens = lexer.tokenize();
expect(tokens[0].value).to.be('sum'); expect(tokens[0].value).to.be('sum');
expect(tokens[0].type).to.be(Lexer.Token.Identifier); expect(tokens[0].type).to.be('identifier');
expect(tokens[1].value).to.be('('); expect(tokens[1].value).to.be('(');
expect(tokens[1].type).to.be(Lexer.Token.Punctuator); expect(tokens[1].type).to.be('(');
expect(tokens[5].type).to.be(Lexer.Token.Punctuator); expect(tokens[5].type).to.be(',');
expect(tokens[5].value).to.be(','); expect(tokens[5].value).to.be(',');
expect(tokens[6].type).to.be(Lexer.Token.NumericLiteral); expect(tokens[6].type).to.be('number');
expect(tokens[6].value).to.be('12'); expect(tokens[6].value).to.be('12');
expect(tokens[8].type).to.be(Lexer.Token.StringLiteral); expect(tokens[8].type).to.be('string');
expect(tokens[8].value).to.be('test'); expect(tokens[8].value).to.be('test');
expect(tokens[tokens.length - 1].value).to.be(')'); expect(tokens[tokens.length - 1].value).to.be(')');
}); });
......
...@@ -9,7 +9,7 @@ define([ ...@@ -9,7 +9,7 @@ define([
var rootNode = parser.getAst(); var rootNode = parser.getAst();
expect(parser.error).to.be(null); expect(parser.error).to.be(null);
expect(rootNode.type).to.be(Parser.Nodes.MetricExpression); expect(rootNode.type).to.be('metric');
expect(rootNode.segments.length).to.be(5); expect(rootNode.segments.length).to.be(5);
expect(rootNode.segments[0].value).to.be('metric'); expect(rootNode.segments[0].value).to.be('metric');
...@@ -19,7 +19,7 @@ define([ ...@@ -19,7 +19,7 @@ define([
var parser = new Parser('sum(test)'); var parser = new Parser('sum(test)');
var rootNode = parser.getAst(); var rootNode = parser.getAst();
expect(parser.error).to.be(null); expect(parser.error).to.be(null);
expect(rootNode.type).to.be(Parser.Nodes.FunctionCall); expect(rootNode.type).to.be('function');
expect(rootNode.params.length).to.be(1); expect(rootNode.params.length).to.be(1);
}); });
...@@ -28,11 +28,11 @@ define([ ...@@ -28,11 +28,11 @@ define([
var rootNode = parser.getAst(); var rootNode = parser.getAst();
expect(parser.error).to.be(null); expect(parser.error).to.be(null);
expect(rootNode.type).to.be(Parser.Nodes.FunctionCall); expect(rootNode.type).to.be('function');
expect(rootNode.params.length).to.be(3); expect(rootNode.params.length).to.be(3);
expect(rootNode.params[0].type).to.be(Parser.Nodes.MetricExpression); expect(rootNode.params[0].type).to.be('metric');
expect(rootNode.params[1].type).to.be(Parser.Nodes.NumericLiteral); expect(rootNode.params[1].type).to.be('number');
expect(rootNode.params[2].type).to.be(Parser.Nodes.StringLiteral); expect(rootNode.params[2].type).to.be('string');
}); });
it('function with nested function', function() { it('function with nested function', function() {
...@@ -40,13 +40,13 @@ define([ ...@@ -40,13 +40,13 @@ define([
var rootNode = parser.getAst(); var rootNode = parser.getAst();
expect(parser.error).to.be(null); expect(parser.error).to.be(null);
expect(rootNode.type).to.be(Parser.Nodes.FunctionCall); expect(rootNode.type).to.be('function');
expect(rootNode.params.length).to.be(1); expect(rootNode.params.length).to.be(1);
expect(rootNode.params[0].type).to.be(Parser.Nodes.FunctionCall); expect(rootNode.params[0].type).to.be('function');
expect(rootNode.params[0].name).to.be('scaleToSeconds'); expect(rootNode.params[0].name).to.be('scaleToSeconds');
expect(rootNode.params[0].params.length).to.be(2); expect(rootNode.params[0].params.length).to.be(2);
expect(rootNode.params[0].params[0].type).to.be(Parser.Nodes.MetricExpression); expect(rootNode.params[0].params[0].type).to.be('metric');
expect(rootNode.params[0].params[1].type).to.be(Parser.Nodes.NumericLiteral); expect(rootNode.params[0].params[1].type).to.be('number');
}); });
it('function with multiple series', function() { it('function with multiple series', function() {
...@@ -54,10 +54,10 @@ define([ ...@@ -54,10 +54,10 @@ define([
var rootNode = parser.getAst(); var rootNode = parser.getAst();
expect(parser.error).to.be(null); expect(parser.error).to.be(null);
expect(rootNode.type).to.be(Parser.Nodes.FunctionCall); expect(rootNode.type).to.be('function');
expect(rootNode.params.length).to.be(2); expect(rootNode.params.length).to.be(2);
expect(rootNode.params[0].type).to.be(Parser.Nodes.MetricExpression); expect(rootNode.params[0].type).to.be('metric');
expect(rootNode.params[1].type).to.be(Parser.Nodes.MetricExpression); expect(rootNode.params[1].type).to.be('metric');
}); });
}); });
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment