- +
- +
diff --git a/article.css b/article.css new file mode 100644 index 0000000..5281725 --- /dev/null +++ b/article.css @@ -0,0 +1,168 @@ +main { + margin: 24px 0 48px; +} + +main h2 { + margin: 0 0 8px; + color: #bbb; + font-size: 24pt; + font-weight: bold; +} + +main p { + margin: 0 0 8px; + line-height: 1.35em; + text-indent: 2.5em; + text-align: justify; + font-size: 13pt; + font-weight: normal; +} + +main .footer { + font-size: 10pt; + text-align: center; +} + +main code { + padding: 0 3px; + background-color: #1d1f21; + color: #de935f; + font-family: 'Source Code Pro', 'Ubuntu Mono', 'Courier New', monospace; +} + +main pre { /* tomorrow night: https://github.com/chriskempson/tomorrow-theme */ + margin: 14px 2px; + padding: 10px 16px; + border-left: 4px solid #7f7f7f; + background-color: #1d1f21; + color: #ddd; + font-size: 12pt; + font-weight: normal; + font-family: 'Source Code Pro', 'Ubuntu Mono', 'Courier New', monospace; +} + +main pre > .prop { + color: #cc6666; +} + +main pre > .fn { + color: #f0c674; +} + +main pre > .bool { + color: #b294bb; +} + +main pre > .str { + color: #b5bd68; +} + +main pre > .num { + color: #81a2be; +} + +main pre > .op { + color: #ccc; +} + +main strong { + color: #ccc; + font-weight: bold; +} + +main .rb-text { + background-image: linear-gradient(to left, #f5f, #a0a, #5ff, #5f5, #ff5, #fa0, #a00, #f5f); + background-size: 300% 100%; + -webkit-background-clip: text; + color: transparent; + animation: scroll-bg 4s linear infinite; +} + +main .math { + font-family: 'CMU Serif', 'Cambria Math', 'Times New Roman', serif; +} + +main .heart { + color: #e44078; +} + +@keyframes scroll-bg { + 0% { + background-position-x: 0; + } + 100% { + background-position-x: 300%; + } +} + +.full-width { + width: 100%; + margin: 4px 0 32px; + padding: 0; +} + +.full-width > img { + width: 100%; + background-color: #000; + filter: brightness(0.7) contrast(1.2) grayscale(0.5); +} + +.section { + margin: 0 25vw 28px; +} + +.docs { + margin: 14px 0; +} + +.docs h3 { + margin: 0 0 8px; + color: #aaa; + font-size: 20pt; + font-weight: bold; +} + +.docs-entry { + margin: 4px 0 16px; +} + +.docs-entry-key { + margin-bottom: 6px; + padding: 4px 6px; + display: flex; + flex-flow: row; + align-items: baseline; + background-color: #1d1f21; + font-weight: normal; +} + +.docs-entry-key-id { + color: #cc6666; + font-size: 16pt; + font-family: 'Source Code Pro', 'Ubuntu Mono', 'Courier New', monospace; +} + +.docs-entry-key-type { + flex: 1; + margin-left: 8px; + color: #de935f; + font-size: 11pt; + font-family: 'Source Code Pro', 'Ubuntu Mono', 'Courier New', monospace; +} + +.docs-entry-key-alias { + float: right; + color: #515356; + font-size: 11pt; +} + +.docs-entry-key-alias > .alias { + float: none; + color: #969896; + font-family: 'Source Code Pro', 'Ubuntu Mono', 'Courier New', monospace; +} + +.docs-entry > p { + margin-left: 1.5em; + text-indent: 0; +} diff --git a/expr_parser.js b/expr_parser.js new file mode 100644 index 0000000..13f0a07 --- /dev/null +++ b/expr_parser.js @@ -0,0 +1,805 @@ +/** + * See `expr_parser.md` for notes on the implementation of this parser! + */ +const ExprParser = (function() { + // buffer containing a list of tokens and a movable pointer into the list + class TokenBuf { + constructor(tokens) { + this.tokens = tokens; + this.index = 0; + } + + get peek() { + return this.tokens[this.index]; + } + + consume(termName) { + if (this.peek.type !== termName) { + throw new Error(`Expected a ${termName}, but got a ${this.peek.type}!`) + } + const node = { type: 'term', token: this.peek }; + ++this.index; + return node; + } + } + + // tokenize an expression string + function tokenize(exprStr) { + exprStr = exprStr.trim(); + const tokens = []; + let col = 0; + + function pushSymbol(sym) { + tokens.push({ type: sym }); + col += sym.length; + } + + while (col < exprStr.length) { + // parse fixed symbols, like operators and stuff + switch (exprStr[col]) { + case '(': + case ')': + case ',': + case '&': + case '|': + case '+': + case '-': + case '*': + case '/': + case '^': + case '=': + pushSymbol(exprStr[col]); + continue; + case '>': + pushSymbol(exprStr[col + 1] === '=' ? '>=' : '>'); + continue; + case '<': + pushSymbol(exprStr[col + 1] === '=' ? '<=' : '<'); + continue; + case '!': + pushSymbol(exprStr[col + 1] === '=' ? '!=' : '!'); + continue; + case ' ': // ignore extra whitespace + ++col; + continue; + } + if (exprStr.slice(col, col + 2) === "?=") { + pushSymbol("?="); + continue; + } + // parse a numeric literal + let m; + if ((m = /^\d+(?:\.\d*)?/.exec(exprStr.substring(col))) !== null) { + tokens.push({ type: 'nLit', value: parseFloat(m[0]) }); + col += m[0].length; + continue; + } + // parse a string literal + if ((m = /^"([^"]+)"/.exec(exprStr.substring(col))) !== null) { // with double-quotes + tokens.push({ type: 'sLit', value: m[1] }); + col += m[0].length; + continue; + } + if ((m = /^'([^']+)'/.exec(exprStr.substring(col))) !== null) { // with single-quotes + tokens.push({ type: 'sLit', value: m[1] }); + col += m[0].length; + continue; + } + // parse an identifier or boolean literal + if ((m = /^\w[\w\d%]*/.exec(exprStr.substring(col))) !== null) { + switch (m[0]) { + case 'true': + tokens.push({ type: 'bLit', value: true }); + col += 4; + continue; + case 'false': + tokens.push({ type: 'bLit', value: false }); + col += 5; + continue; + } + tokens.push({ type: 'ident', id: m[0] }); + col += m[0].length; + continue; + } + // if we reach here without successfully parsing a token, it's an error + throw new Error(`Could not parse character "${exprStr[col]}" at position ${col}`); + } + tokens.push({ type: 'eof' }); + return new TokenBuf(tokens); + } + + // parse an AST from a sequence of tokens + function takeExpr(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeConj(tokens)); + return { type: 'nonterm', name: 'expr', prod: 0, children }; + default: + throw new Error('Could not parse an expression!'); + } + } + + function takeExprList(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeExpr(tokens)); + children.push(takeExprList0(tokens)); + return { type: 'nonterm', name: 'exprList', prod: 0, children }; + default: + throw new Error('Could not parse an expression list!'); + } + } + + function takeExprList0(tokens) { + const children = []; + switch (tokens.peek.type) { + case ',': + children.push(tokens.consume(',')); + children.push(takeExpr(tokens)); + children.push(takeExprList0(tokens)); + return { type: 'nonterm', name: 'exprList\'', prod: 0, children }; + case ')': + case 'eof': + return { type: 'nonterm', name: 'exprList\'', prod: 1, children }; + default: + throw new Error('Could not parse a expression list!'); + } + } + + function takeConj(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeDisj(tokens)); + children.push(takeConj0(tokens)); + return { type: 'nonterm', name: 'conj', prod: 0, children }; + default: + throw new Error('Could not parse a conjunction!'); + } + } + + function takeConj0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '&': + children.push(tokens.consume('&')); + children.push(takeDisj(tokens)); + children.push(takeConj0(tokens)); + return { type: 'nonterm', name: 'conj\'', prod: 0, children }; + case ')': + case ',': + case 'eof': + return { type: 'nonterm', name: 'conj\'', prod: 1, children }; + default: + throw new Error('Could not parse a conjunction!'); + } + } + + function takeDisj(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeCmpEq(tokens)); + children.push(takeDisj0(tokens)); + return { type: 'nonterm', name: 'disj', prod: 0, children }; + default: + throw new Error('Could not parse a disjunction!'); + } + } + + function takeDisj0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '|': + children.push(tokens.consume('|')); + children.push(takeCmpEq(tokens)); + children.push(takeDisj0(tokens)); + return { type: 'nonterm', name: 'disj\'', prod: 0, children }; + case '&': + case ')': + case ',': + case 'eof': + return { type: 'nonterm', name: 'disj\'', prod: 1, children }; + default: + throw new Error('Could not parse a disjunction!'); + } + } + + function takeCmpEq(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeCmpRel(tokens)); + children.push(takeCmpEq0(tokens)); + return { type: 'nonterm', name: 'cmpEq', prod: 0, children }; + default: + throw new Error('Could not parse an equality comparison!'); + } + } + + function takeCmpEq0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '=': + children.push(tokens.consume('=')); + children.push(takeCmpRel(tokens)); + children.push(takeCmpEq0(tokens)); + return { type: 'nonterm', name: 'cmpEq\'', prod: 0, children }; + case '!=': + children.push(tokens.consume('!=')); + children.push(takeCmpRel(tokens)); + children.push(takeCmpEq0(tokens)); + return { type: 'nonterm', name: 'cmpEq\'', prod: 1, children }; + case '?=': + children.push(tokens.consume('?=')); + children.push(takeCmpRel(tokens)); + children.push(takeCmpEq0(tokens)); + return { type: 'nonterm', name: 'cmpEq\'', prod: 2, children }; + case '&': + case ')': + case ',': + case '|': + case 'eof': + return { type: 'nonterm', name: 'cmpEq\'', prod: 3, children }; + default: + throw new Error('Could not parse an equality comparison!'); + } + } + + function takeCmpRel(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeSum(tokens)); + children.push(takeCmpRel0(tokens)); + return { type: 'nonterm', name: 'cmpRel', prod: 0, children }; + default: + throw new Error('Could not parse a relational comparison!'); + } + } + + function takeCmpRel0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '<=': + children.push(tokens.consume('<=')); + children.push(takeSum(tokens)); + children.push(takeCmpRel0(tokens)); + return { type: 'nonterm', name: 'cmpRel\'', prod: 0, children }; + case '<': + children.push(tokens.consume('<')); + children.push(takeSum(tokens)); + children.push(takeCmpRel0(tokens)); + return { type: 'nonterm', name: 'cmpRel\'', prod: 1, children }; + case '>': + children.push(tokens.consume('>')); + children.push(takeSum(tokens)); + children.push(takeCmpRel0(tokens)); + return { type: 'nonterm', name: 'cmpRel\'', prod: 2, children }; + case '>=': + children.push(tokens.consume('>=')); + children.push(takeSum(tokens)); + children.push(takeCmpRel0(tokens)); + return { type: 'nonterm', name: 'cmpRel\'', prod: 3, children }; + case '!=': + case '&': + case ')': + case ',': + case '=': + case '?=': + case '|': + case 'eof': + return { type: 'nonterm', name: 'cmpRel\'', prod: 4, children }; + default: + throw new Error('Could not parse a relational comparison!'); + } + } + + function takeSum(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeProd(tokens)); + children.push(takeSum0(tokens)); + return { type: 'nonterm', name: 'sum', prod: 0, children }; + default: + throw new Error('Could not parse an additive expression!'); + } + } + + function takeSum0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '+': + children.push(tokens.consume('+')); + children.push(takeProd(tokens)); + children.push(takeSum0(tokens)); + return { type: 'nonterm', name: 'sum\'', prod: 0, children }; + case '-': + children.push(tokens.consume('-')); + children.push(takeProd(tokens)); + children.push(takeSum0(tokens)); + return { type: 'nonterm', name: 'sum\'', prod: 1, children }; + case '!=': + case '&': + case ')': + case ',': + case '<': + case '<=': + case '=': + case '>': + case '>=': + case '?=': + case '|': + case 'eof': + return { type: 'nonterm', name: 'sum\'', prod: 2, children }; + default: + throw new Error('Could not parse an additive expression!'); + } + } + + function takeProd(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeExp(tokens)); + children.push(takeProd0(tokens)); + return { type: 'nonterm', name: 'prod', prod: 0, children }; + default: + throw new Error('Could not parse a multiplicative expression!'); + } + } + + function takeProd0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '*': + children.push(tokens.consume('*')); + children.push(takeExp(tokens)); + children.push(takeProd0(tokens)); + return { type: 'nonterm', name: 'prod\'', prod: 0, children }; + case '/': + children.push(tokens.consume('/')); + children.push(takeExp(tokens)); + children.push(takeProd0(tokens)); + return { type: 'nonterm', name: 'prod\'', prod: 1, children }; + case '!=': + case '&': + case ')': + case '+': + case ',': + case '-': + case '<': + case '<=': + case '=': + case '>': + case '>=': + case '?=': + case '|': + case 'eof': + return { type: 'nonterm', name: 'prod\'', prod: 2, children }; + default: + throw new Error('Could not parse a multiplicative expression!'); + } + } + + function takeExp(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeUnary(tokens)); + children.push(takeExp0(tokens)); + return { type: 'nonterm', name: 'exp', prod: 0, children }; + default: + throw new Error('Could not parse an exponential expression!'); + } + } + + function takeExp0(tokens) { + const children = []; + switch (tokens.peek.type) { + case '^': + children.push(tokens.consume('^')); + children.push(takeUnary(tokens)); + children.push(takeExp0(tokens)); + return { type: 'nonterm', name: 'exp\'', prod: 0, children }; + case '!=': + case '&': + case ')': + case '*': + case '+': + case ',': + case '-': + case '/': + case '<': + case '<=': + case '=': + case '>': + case '>=': + case '?=': + case '|': + case 'eof': + return { type: 'nonterm', name: 'exp\'', prod: 1, children }; + default: + throw new Error('Could not parse an exponential expression!'); + } + } + + function takeUnary(tokens) { + const children = []; + switch (tokens.peek.type) { + case '-': + children.push(tokens.consume('-')); + children.push(takeUnary(tokens)); + return { type: 'nonterm', name: 'unary', prod: 0, children }; + case '!': + children.push(tokens.consume('!')); + children.push(takeUnary(tokens)); + return { type: 'nonterm', name: 'unary', prod: 1, children }; + case '(': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takePrim(tokens)); + return { type: 'nonterm', name: 'unary', prod: 2, children }; + default: + throw new Error('Could not parse a unary expression!'); + } + } + + function takePrim(tokens) { + const children = []; + switch (tokens.peek.type) { + case 'nLit': + children.push(tokens.consume('nLit')); + return { type: 'nonterm', name: 'prim', prod: 0, children }; + case 'bLit': + children.push(tokens.consume('bLit')); + return { type: 'nonterm', name: 'prim', prod: 1, children }; + case 'sLit': + children.push(tokens.consume('sLit')); + return { type: 'nonterm', name: 'prim', prod: 2, children }; + case 'ident': + children.push(tokens.consume('ident')); + children.push(takeIdentTail(tokens)); + return { type: 'nonterm', name: 'prim', prod: 3, children }; + case '(': + children.push(tokens.consume('(')); + children.push(takeExpr(tokens)); + children.push(tokens.consume(')')); + return { type: 'nonterm', name: 'prim', prod: 4, children }; + default: + throw new Error('Could not parse a primitive value!'); + } + } + + function takeIdentTail(tokens) { + const children = []; + switch (tokens.peek.type) { + case '(': + children.push(tokens.consume('(')); + children.push(takeArgs(tokens)); + children.push(tokens.consume(')')); + return { type: 'nonterm', name: 'identTail', prod: 0, children }; + case '!=': + case '&': + case ')': + case '*': + case '+': + case ',': + case '-': + case '/': + case '<': + case '<=': + case '=': + case '>': + case '>=': + case '?=': + case '^': + case '|': + case 'eof': + return { type: 'nonterm', name: 'identTail', prod: 1, children }; + default: + throw new Error('Could not parse an identifier expression!'); + } + } + + function takeArgs(tokens) { + const children = []; + switch (tokens.peek.type) { + case '!': + case '(': + case '-': + case 'bLit': + case 'ident': + case 'nLit': + case 'sLit': + children.push(takeExprList(tokens)); + return { type: 'nonterm', name: 'args', prod: 0, children }; + case ')': + case 'eof': + return { type: 'nonterm', name: 'args', prod: 1, children }; + default: + throw new Error('Could not parse an argument list!'); + } + } + + // apply tree transformations to recover the nominal-grammar AST + function fixUp(ast) { + if (ast.type === 'term') { + return ast; + } + switch (ast.name) { + case 'exprList': // recover left-recursive structures + case 'conj': + case 'disj': + case 'exp': + return fixUpRightRecurse(ast, 1); + case 'sum': + case 'prod': + return fixUpRightRecurse(ast, 2); + case 'cmpEq': + return fixUpRightRecurse(ast, 3); + case 'cmpRel': + return fixUpRightRecurse(ast, 4); + case 'prim': // recover left-factored identifier things + switch (ast.prod) { + case 3: + switch (ast.children[1].prod) { + case 0: // function call + return { + type: 'nonterm', name: 'prim', prod: 3, + children: [fixUp(ast.children[0]), ...mapFixUp(ast.children[1].children)] + }; + case 1: // just an identifier + return { type: 'nonterm', name: 'prim', prod: 4, children: [fixUp(ast.children[0])] }; + } + break; + case 4: + return { ...ast, prod: 5, children: mapFixUp(ast.children) }; + } + break; + } + return { ...ast, children: mapFixUp(ast.children) }; + } + + function mapFixUp(nodes) { + return nodes.map(chAst => fixUp(chAst)); + } + + function fixUpRightRecurse(ast, maxProd) { + let nomAst = { type: 'nonterm', name: ast.name, prod: maxProd, children: [fixUp(ast.children[0])] }; + let tree = ast.children[1]; + while (tree.prod < maxProd) { + nomAst = { + type: 'nonterm', name: ast.name, prod: tree.prod, + children: [nomAst, ...mapFixUp(tree.children.slice(0, tree.children.length - 1))] + }; + tree = tree.children[tree.children.length - 1]; + } + return nomAst; + } + + // compile nominal AST into an item builder expression function + function translate(ast, builtInProps, builtInFuncs) { + function trans(ast) { + return translate(ast, builtInProps, builtInFuncs); + } + + if (ast.type === 'term') { + switch (ast.token.type) { + case 'nLit': + return ast.token.value; + case 'bLit': + return ast.token.value; + case 'sLit': + return ast.token.value; + case 'ident': + return ast.token.value; + } + } else if (ast.type === 'nonterm') { + switch (ast.name) { + case 'expr': + return trans(ast.children[0]); + case 'exprList': + switch (ast.prod) { + case 0: + return [...trans(ast.children[0]), trans(ast.children[2])]; + case 1: + return [trans(ast.children[0])]; + } + break; + case 'conj': + switch (ast.prod) { + case 0: + return new ConjTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return trans(ast.children[0]); + } + break; + case 'disj': + switch (ast.prod) { + case 0: + return new DisjTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return trans(ast.children[0]); + } + break; + case 'cmpEq': + switch (ast.prod) { + case 0: + return new EqTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return new NeqTerm(trans(ast.children[0]), trans(ast.children[2])); + case 2: + return new ContainsTerm(trans(ast.children[0]), trans(ast.children[2])); + case 3: + return trans(ast.children[0]); + } + break; + case 'cmpRel': + switch (ast.prod) { + case 0: + return new LeqTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return new LtTerm(trans(ast.children[0]), trans(ast.children[2])); + case 2: + return new GtTerm(trans(ast.children[0]), trans(ast.children[2])); + case 3: + return new GeqTerm(trans(ast.children[0]), trans(ast.children[2])); + case 4: + return trans(ast.children[0]); + } + break; + case 'sum': + switch (ast.prod) { + case 0: + return new AddTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return new SubTerm(trans(ast.children[0]), trans(ast.children[2])); + case 2: + return trans(ast.children[0]); + } + break; + case 'prod': + switch (ast.prod) { + case 0: + return new MulTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return new DivTerm(trans(ast.children[0]), trans(ast.children[2])); + case 2: + return trans(ast.children[0]); + } + break; + case 'exp': + switch (ast.prod) { + case 0: + return new ExpTerm(trans(ast.children[0]), trans(ast.children[2])); + case 1: + return trans(ast.children[0]); + } + break; + case 'unary': + switch (ast.prod) { + case 0: + return new NegTerm(trans(ast.children[1])); + case 1: + return new InvTerm(trans(ast.children[1])); + case 2: + return trans(ast.children[0]); + } + break; + case 'prim': + switch (ast.prod) { + case 0: + return new NumLitTerm(ast.children[0].token.value); + case 1: + return new BoolLitTerm(ast.children[0].token.value); + case 2: + return new StrLitTerm(ast.children[0].token.value); + case 3: + const fn = builtInFuncs[ast.children[0].token.id.toLowerCase()]; + if (!fn) { + throw new Error(`Unknown function: ${ast.children[0].token.id}`); + } + return new FnCallTerm(fn, trans(ast.children[2])); + case 4: { + const prop = builtInProps[ast.children[0].token.id.toLowerCase()]; + if (!prop) { + throw new Error(`Unknown property: ${ast.children[0].token.id}`); + } + return new PropTerm(prop); + } + case 5: + return trans(ast.children[1]); + } + break; + case 'args': + switch (ast.prod) { + case 0: + return trans(ast.children[0]); + case 1: + return []; + } + break; + } + } + } + + return class ExprParser { + constructor(builtInProps, builtInFuncs) { + this.builtInProps = builtInProps; + this.builtInFuncs = builtInFuncs; + } + + parse(exprStr) { + const tokens = tokenize(exprStr); + if (tokens.tokens.length <= 1) { + return null; + } + const transAst = takeExpr(tokens, 0); + if (tokens.peek.type !== 'eof') { + throw new Error('Could not parse entire expression!'); + } + const nomAst = fixUp(transAst); + return translate(nomAst, this.builtInProps, this.builtInFuncs); + } + }; +})(); diff --git a/expr_parser.md b/expr_parser.md new file mode 100644 index 0000000..f7e3ffc --- /dev/null +++ b/expr_parser.md @@ -0,0 +1,197 @@ +This file contains notes on how the parser implemented in `expr_parser.js` is designed. +The nominal grammar is as follows: + +``` +expr := conj + +exprList := exprList "," expr + | expr + +conj := conj "&" disj + | disj + +disj := disj "|" cmpEq + | cmpEq + +cmpEq := cmpEq "=" cmpRel + | cmpEq "!=" cmpRel + | cmpEq "?=" cmpRel + | cmpRel + +cmpRel := cmpRel "<=" sum + | cmpRel "<" sum + | cmpRel ">" sum + | cmpRel ">=" sum + | sum + +sum := sum "+" prod + | sum "-" prod + | prod + +prod := prod "*" exp + | prod "/" exp + | exp + +exp := exp "^" unary + | unary + +unary := "-" unary + | "!" unary + | prim + +prim := nLit + | bLit + | sLit + | ident "(" args ")" + | ident + | "(" expr ")" + +args := exprList + | ε +``` + +In order to eliminate left-recursion, the above grammar is transformed into the following: + +``` +expr := conj + +exprList := expr exprListTail + +exprList' := "," expr exprList' + | ε + +conj := disj conj' + +conj' := "&" disj conj' + | ε + +disj := cmpEq disj' + +disj' := "|" cmpEq disj' + | ε + +cmpEq := cmpRel cmpEq' + +cmpEq' := "=" cmpRel cmpEq' + | "!=" cmpRel cmpEq' + | "?=" cmpRel cmpEq' + | ε + +cmpRel := sum cmpRel' + +cmpRel' := "<=" sum cmpRel' + | "<" sum cmpRel' + | ">" sum cmpRel' + | ">=" sum cmpRel' + | ε + +sum := prod sum' + +sum' := "+" prod sum' + | "-" prod sum' + | ε + +prod := exp prod' + +prod' := "*" exp prod' + | "/" exp prod' + | ε + +exp := unary exp' + +exp' := "^" unary exp' + | ε + +unary := "-" unary + | "!" unary + | prim + +prim := nLit + | bLit + | sLit + | ident identTail + | "(" expr ")" + +identTail := "(" args ")" + | ε + +args := exprList + | ε +``` + +The parser itself is a recursive-descent LL(1) parser. +To build the parsing rules, the following `FIRST` and `FOLLOW` sets are computed for the above grammar: + +Nonterminal | FIRST +----------- | ----- +`expr` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`exprList` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`exprList'` | `","`, `ε` +`conj` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`conj'` | `"&"`, `ε` +`disj` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`disj'` | `"\|"`, `ε` +`cmpEq` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`cmpEq'` | `"!="`, `"="`, `"?="`, `ε` +`cmpRel` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`cmpRel'` | `"<"`, `"<="`, `">"`, `">="`, `ε` +`sum` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`sum'` | `"+"`, `"-"`, `ε` +`prod` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`prod'` | `"*"`, `"/"`, `ε` +`exp` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`exp'` | `"^"`, `ε` +`unary` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit` +`prim` | `"("`, `bLit`, `ident`, `nLit`, `sLit` +`identTail` | `"("`, `ε` +`args` | `"!"`, `"("`, `"-"`, `bLit`, `ident`, `nLit`, `sLit`, `ε` + +Nonterminal | FOLLOW +----------- | ------ +`expr` | `")"`, `","`, `$` +`exprList` | `")"` +`exprList'` | `")"` +`conj` | `")"`, `","` +`conj'` | `")"`, `","` +`disj` | `"&"`, `")"`, `","` +`disj'` | `"&"`, `")"`, `","` +`cmpEq` | `"&"`, `")"`, `","`, `"\|"` +`cmpEq'` | `"&"`, `")"`, `","`, `"\|"` +`cmpRel` | `"!="`, `"&"`, `")"`, `","`, `"="`, `"?="`, `"\|"` +`cmpRel'` | `"!="`, `"&"`, `")"`, `","`, `"="`, `"?="`, `"\|"` +`sum` | `"!="`, `"&"`, `")"`, `","`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`sum'` | `"!="`, `"&"`, `")"`, `","`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`prod` | `"!="`, `"&"`, `")"`, `"+"`, `","`, `"-"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`prod'` | `"!="`, `"&"`, `")"`, `"+"`, `","`, `"-"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`exp` | `"!="`, `"&"`, `")"`, `"*"`, `"+"`, `","`, `"-"`, `"/"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`exp'` | `"!="`, `"&"`, `")"`, `"*"`, `"+"`, `","`, `"-"`, `"/"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"\|"` +`unary` | `"!="`, `"&"`, `")"`, `"*"`, `"+"`, `","`, `"-"`, `"/"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"^"`, `"\|"` +`prim` | `"!="`, `"&"`, `")"`, `"*"`, `"+"`, `","`, `"-"`, `"/"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"^"`, `"\|"` +`identTail` | `"!="`, `"&"`, `")"`, `"*"`, `"+"`, `","`, `"-"`, `"/"`, `"<"`, `"<="`, `"="`, `">"`, `">="`, `"?="`, `"^"`, `"\|"` +`args` | `")"` + +Then, the parsing rule table is as follows, where each table entry refers to the production number for the given nonterminal: + +Nonterminal | "!" | "!=" | "&" | "(" | ")" | "*" | "+" | "," | "-" | "/" | "<" | "<=" | "=" | ">" | ">=" | "?=" | "^" | "|" | bLit | ident | nLit | sLit | $ +----------- | --- | ---- | --- | --- | --- | --- | --- | --- | --- | --- | --- | ---- | --- | --- | ---- | ---- | --- | --- | ---- | ----- | ---- | ---- | --- +expr | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +exprList | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +exprList' | - | - | - | - | 1 | - | - | 0 | - | - | - | - | - | - | - | - | - | - | - | - | - | - | 1 +conj | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +conj' | - | - | 0 | - | 1 | - | - | 1 | - | - | - | - | - | - | - | - | - | - | - | - | - | - | 1 +disj | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +disj' | - | - | 1 | - | 1 | - | - | 1 | - | - | - | - | - | - | - | - | - | 0 | - | - | - | - | 1 +cmpEq | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +cmpEq' | - | 1 | 3 | - | 3 | - | - | 3 | - | - | - | - | 0 | - | - | 2 | - | 3 | - | - | - | - | 3 +cmpRel | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +cmpRel' | - | 4 | 4 | - | 4 | - | - | 4 | - | - | 1 | 0 | 4 | 2 | 3 | 4 | - | 4 | - | - | - | - | 4 +sum | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +sum' | - | 2 | 2 | - | 2 | - | 0 | 2 | 1 | - | 2 | 2 | 2 | 2 | 2 | 2 | - | 2 | - | - | - | - | 2 +prod | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +prod' | - | 2 | 2 | - | 2 | 0 | 2 | 2 | 2 | 1 | 2 | 2 | 2 | 2 | 2 | 2 | - | 2 | - | - | - | - | 2 +exp | 0 | - | - | 0 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | - +exp' | - | 1 | 1 | - | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 0 | 1 | - | - | - | - | 1 +unary | 1 | - | - | 2 | - | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 2 | 2 | 2 | 2 | - +prim | - | - | - | 4 | - | - | - | - | - | - | - | - | - | - | - | - | - | - | 1 | 3 | 0 | 2 | - +identTail | - | 1 | 1 | 0 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | 1 | - | - | - | - | 1 +args | 0 | - | - | 0 | 1 | - | - | - | 0 | - | - | - | - | - | - | - | - | - | 0 | 0 | 0 | 0 | 1 diff --git a/items_2.html b/items_2.html index e0f2aa4..27fd286 100644 --- a/items_2.html +++ b/items_2.html @@ -12,70 +12,74 @@
WynnAtlas
WynnAtlas
-WynnAtlas
+The WynnBuilder team has been hard at work giving you the latest and greatest tools for optimizing your most complex Wynncraft builds. Now, we're introducing WynnAtlas, the new, bigger, better, smarter, powerful-er item guide! Featuring an extremely flexible expression language for filtering and sorting items, WynnAtlas' advanced item search system gives build engineers the power to select items with a high degree of granularity. Picking components for your brand-new Divzer WFA build has never been easier!
+The advanced item search interface uses two separate expressions: one for filtering items and the other for sorting them. The idea is that you can filter for items matching a set of criteria that are absolutely necessary for the item you want, then sort the remaining items to find the optimal build component. The expressions themselves are mathematical formulae that compute values from the properties of items, such as their damage values and identifications.
+As an example, suppose you want a helmet granting at least 10 intelligence that maximizes spell damage gain for a build using the Nepta Floodbringer. We would start by writing a filter for helmets with our desired bound on intelligence:
+{prop:type} {op:=} {str:"helmet"} {op:&} {prop:int} {op:>=} {num:10}+
Then, wee would write an expression that computes the amount of damage we get from the helmet. To do this, we first check the damage numbers for the Nepta Floodbringer: assuming we aren't using any powders, we have 96–112 water damage scaled by the super-fast attack speed modifier of 4.3, giving us a total of 4.3 × (96 + 112) ÷ 2 = 447.2. We then multiply in the spell damage and water damage modifiers and add raw spell damage, giving us:
+{prop:sdRaw} {op:+} {num:447.2} {op:*} {op:(}{prop:sdPct} {op:+} {prop:wDamPct}{op:)} {op:/} {num:100}+
And, voilà! In the blink of an eye, we've discovered that Caesura is the best helmet for our criteria, granting 448.14 spell damage.
+Roughly speaking, the expression language just consists of mathematical expressions with simple operations and functions. Each value in the expression is either a number, a boolean (true or false), or a string (a chunk of text). Numbers are floating-point rather than integers, so any kind of fractional value can also be expressed. String literals can use either single- or double-quotes, so the following is true: +
{str:"Hello, world!"} {op:=} {str:'Hello, world!'}+
The filtering expression should produce a boolean in the end, which represents whether an item matches the filter or not, and the sorting expression should produce either a number or a string, which are used to order the items. The sorting expression can even contain multiple sub-expressions separated by semicolons, which are then used to sort the result lexicographically. For example, if I want to sort items by loot bonus, then XP bonus if items have equal loot bonus, I could write:
+{prop:lb}; {prop:xpb}+
The supported mathematical operations include the basic arithmetic operations as well as exponentiation. These operators obey the usual order of operations, with exponentiation having the highest priority. Parentheses are also supported for grouping.
+({num:1} {op:+} {num:2}) {op:-} {num:3} {op:*} ({num:4} {op:/} {num:5}) {op:^} {num:6}+
The supported boolean operations include conjunction (“AND”) and disjunction (“OR”) using the &
and |
symbols, as well as unary inversion (“NOT”) using the !
symbol. Disjunction has higher priority than conjunction, so the following is true:
{bool:true} {op:|} {bool:false} {op:&} {bool:true} {op:|} {bool:false} {op:=} {op:(}{bool:true} {op:|} {bool:false}{op:)} {op:&} {op:(}{bool:true} {op:|} {bool:false}{op:)}+
For comparisons, equality and non-equality are represented by the =
and !=
symbols. The two operands can be of any type, and the result will always be a boolean describing whether the operands are equal. String comparisons are case-insensitive.
{prop:type} {op:=} {str:"wand"} {op:|} {prop:cat} {op:!=} {str:"weapon"}+
The relational comparisons are given by <
, <=
, >=
, and >
. The two operands must be of some comparable type—booleans cannot be compared, so it's an error to pass them to a relational comparison.
{prop:str} {op:>=} {num:20} {op:&} {prop:lvl} {op:<} {num:80}+
In addition to these comparison operators, there's also a “contains” operator ?=
, which checks whether a string contains a given substring or not. This allows for matching more loosely against strings; for example, if I wanted to see all the Hive master weapons, I could use the filter:
{prop:name} {op:?=} {str:"hive infused"}+
Some handy functions are also available, and can be called using a C-like syntax:
+{fn:min}{op:(}{prop:int}{op:,} {num:105} {op:-} {prop:intReq}{op:)} {op:+} {fn:min}{op:(}{prop:def}{op:,} {num:80} {op:-} {prop:defReq}{op:)}+
Try some of these examples out in the item guide! Experimenting with weird and unusual expressions is a great way to get used to the syntax. The more you practice, the faster and more effective you'll be at using WynnAtlas to optimize your powerful Wynncraft builds!
+What follows are lists of existing built-in properties and functions. Note that some aliases are omitted for properties with way too many aliases. If you want, you can also check out the source code to see the actual declarations for all the built-in objects.
+You can check out the implementation notes for the expression parser, as well as the parser code itself, over at the WynnBuilder GitHub repository. You can also ask around on the Atlas Inc. Discord server if you want more details.
+