From 13a27fbc2e68366e3861ff1607f0a9c75649c71d Mon Sep 17 00:00:00 2001 From: Lutz Roeder Date: Sun, 7 May 2023 09:48:38 -0700 Subject: [PATCH] Add MLIR support (#1044) (#1088) --- source/mlir.js | 1357 +++++++++++++++++++++++++++++++++++++++++++++- test/models.json | 4 +- 2 files changed, 1341 insertions(+), 20 deletions(-) diff --git a/source/mlir.js b/source/mlir.js index eed05c5760..c699634549 100644 --- a/source/mlir.js +++ b/source/mlir.js @@ -1,24 +1,14 @@ +// Experimental +// contributor @tucan9389 + var mlir = {}; var text = require('./text'); mlir.ModelFactory = class { - match(context) { - const stream = context.stream; - if (stream) { - const reader = text.Reader.open(stream, 2048); - for (;;) { - const line = reader.read(); - if (line === undefined) { - break; - } - if (line.indexOf('module ') !== -1) { - return 'mlir'; - } - } - } - return null; + match(/* context */) { + return 'mlir'; } open(context) { @@ -33,9 +23,9 @@ mlir.ModelFactory = class { mlir.Model = class { - constructor(/* obj */) { + constructor(obj) { this._format = 'MLIR'; - this._graphs = []; + this._graphs = obj.functions.map(func => new mlir.Graph(func, '')); } get format() { @@ -47,10 +37,833 @@ mlir.Model = class { } }; +mlir.Graph = class { + + constructor(func, group) { + this._inputs = []; // [mlir.Parameter] + this._outputs = []; // [mlir.Parameter] + this._nodes = []; // [mlir.Node] + const valueType = (type) => { + if (type === undefined) { + return null; + } + // eg. tensor + if (type.startsWith('tensor<')) { + const shapeString = type.substring(7, type.length - 1); + if (!/^[0-9xfiq?*]+$/i.test(shapeString)) { + return type; + } + const parts = shapeString.split('x'); + const dataType = parts[parts.length - 1]; + const shape = parts + .slice(0, -1) + .map((dimension) => { + const parsedDimension = parseInt(dimension.trim()); + return isNaN(parsedDimension) ? '?' : parsedDimension; + }); + return new mlir.TensorType(dataType, new mlir.TensorShape(shape)); + } + return type; + }; + // inputs of function + for (let i = 0; i < func.inputs.length; i++) { + const input = func.inputs[i]; + const inputType = func.inputTypes[i]; + const type = valueType(inputType); + const argument = new mlir.Argument(input, type, "input desc", null); + const parameter = new mlir.Parameter(input, true, [ argument ]); + this._inputs.push(parameter); + } + // outputs of function + for (let i = 0; i < func.outputTypes.length; i++) { + const output = "%return" + "/" + i; + const outputType = func.outputTypes[i]; + const type = valueType(outputType); + const argument = new mlir.Argument(output, type, "output desc", null); + const parameter = new mlir.Parameter(output, true, [ argument ]); + this._outputs.push(parameter); + } + // operations + // args is map of edges. args will be converted to mlir.Arguemnts. + const args = new Map(); + const arg = (name) => { + if (!args.has(name)) { + args.set(name, { name: name, to: [], from: [] }); + } + return args.get(name); + }; + // operations - setup arguments + const operations = func.operations.map((op) => { + const operation = { + type: op.name, + attributes: {}, + inputs: [], + outputs: [], + delete: false, + }; + // TODO: convert attributes to proper types + operation.attributes = op.attributes; + // for (const entry of Object.entries(op.attributes)) { + // const key = entry[0]; + // const value = entry[1]; + // operation.attributes[key] = convertValue(value); + // } + for (let j = 0; j < (op.inputs ? op.inputs.length : 0); j++) { + const input = op.inputs[j]; + const inputType = op.inputTypes[j]; + const value = arg(input); + value.to.push(operation); + const args = [{ name: input, value: inputType }]; + operation.inputs.push({ + name: input, + arguments: args + }); + } + for (let j = 0; j < (op.outputs ? op.outputs.length : 0); j++) { + const output = op.outputs[j]; + const outputType = op.outputTypes[j]; + const value = arg(output); + value.type = valueType(outputType); + value.from.push(operation); + operation.outputs.push({ + name: output, + arguments: [value] + }); + } + return operation; + }); + + // // operations - constant ops + // for (const op of operations) { + // if (op.type === 'const' && op.inputs.length === 0 && + // op.outputs.length === 1 && op.outputs[0].arguments.length === 1) { + // const argument = op.outputs[0].arguments[0]; + // if (op.attributes && op.attributes.val) { + // const type = argument.type; + // const data = op.attributes.val; + // if (data instanceof Uint8Array && data.length === 2 && + // type.dataType === 'float16' && type.shape.dimensions.length === 0) { + // const view = new DataView(data.buffer, data.byteOffset, data.byteLength); + // argument.value = view.getFloat16(0, true); + // } else { + // argument.value = data; + // } + // argument.const = true; + // op.delete = true; + // } + // } + // } + + // // + // for (const op of operations) { + // for (const input of op.inputs) { + // if (input.arguments.length > 1 && input.arguments.some((argument) => argument.const)) { + // if (input.arguments.every((argument) => argument.value instanceof mlir.Tensor)) { + // continue; + // } + // for (const argument of input.arguments) { + // for (const from of argument.from) { + // from.delete = false; + // } + // delete argument.value; + // } + // } + // } + // } + + // for (const op of operations) { + // if (op.delete) { + // continue; + // } + // op.inputs = op.inputs.filter((input) => { + // if (input.arguments.every((argument) => argument.value === undefined || argument.value instanceof coreml.Tensor)) { + // return true; + // } + // if (input.arguments.length === 1) { + // const argument = input.arguments[0]; + // op.attributes[input.name] = argument.value; + // return false; + // } + // op.attributes[input.name] = input.arguments.map((argument) => argument.value[0]); + // return false; + // }); + // } + const tensors = new Map(); + const tensor = (arg) => { + if (!tensors.has(arg.name)) { + tensors.set(arg.name, new mlir.Argument(arg.name, arg.type, null, arg.value)); + } + return tensors.get(arg.name); + }; + for (const input of this._inputs) { + for (const arg of input.arguments) { + tensors.set(arg.name, arg); + } + } + for (const output of this._outputs) { + for (const arg of output.arguments) { + tensors.set(arg.name, arg); + } + } + for (const op of operations) { + if (op.delete) { + continue; + } + op.inputs = op.inputs.map((input) => new mlir.Parameter(input.name, true, input.arguments.map((argument) => tensor(argument)))); + op.outputs = op.outputs.map((output) => new mlir.Parameter(output.name, true, output.arguments.map((argument) => tensor(argument)))); + } + for (const op of operations.filter((op) => !op.delete)) { + const type = op.type; // 'program:' + op.type; + // const metadata = this._metadata.type(type); + // if (metadata && Array.isArray(metadata.inputs)) { + // let index = 1; + // const map = new Map(metadata.inputs.map((input) => [ input.name, index++ ])); + // op.inputs.sort((a, b) => (map.get(a.name) || map.size) - (map.get(b.name) || map.size)); + // } + const node = new mlir.Node(/*this._metadata, */group, type, null, null, op.attributes, op.inputs, op.outputs); + this._nodes.push(node); + } + } + + get inputs() { + return this._inputs; + } + + get outputs() { + return this._outputs; + } + + get nodes() { + return this._nodes; + } +}; + +mlir.Parameter = class { + + constructor(name, visible, args) { + this._name = name; // string + this._visible = visible; // bool + this._arguments = args; // [mlir.Argument] + } + + get name() { + return this._name; + } + + get visible() { + return this._visible == false ? false : true; + } + + get arguments() { + return this._arguments; + } +}; + +mlir.Argument = class { + + constructor(name, type, description, initializer) { + if (typeof name !== 'string') { + throw new mlir.Error("Invalid argument identifier '" + JSON.stringify(name) + "'."); + } + this._name = name; // string + this._type = type || null; // mlir.TensorType + this._description = description || null; + this._initializer = initializer || null; + } + + get name() { + return this._name; + } + + set name(value) { + this._name = value; + } + + get type() { + if (this._initializer) { + return this._initializer.type; + } + return this._type; + } + + set type(value) { + this._type = value; + } + + get description() { + return this._description; + } + + set description(value) { + this._description = value; + } + + get quantization() { + if (this._initializer) { + return this._initializer.quantization; + } + return null; + } + + get initializer() { + return this._initializer; + } +}; + +mlir.Node = class { + + constructor(group, type, name, description, attributes, inputs, outputs) { + if (!type) { + throw new Error('Undefined node type.'); + } + if (group) { + this._group = group; + } + this._type = { name: type || '' }; // string (metadata.type(type) || { name: type } + this._name = name || ''; // string + this._description = description || ''; // string + this._inputs = inputs || []; // [mlir.Parameter] + this._outputs = outputs || []; // [mlir.Parameter] + this._attributes = []; // [mlir.Attribute] + if (attributes) { + for (const key of Object.keys(attributes)) { + // const schema = {}; // metadata.attribute(type, key); + const value = attributes[key]; + const attribute = new mlir.Attribute(key, value); + this._attributes.push(attribute); + } + } + } + + get type() { + return this._type; + } + + get name() { + return this._name; + } + + get description() { + return this._description; + } + + get metadata() { + return this._metadata; + } + + get group() { + return this._group ? this._group : null; + } + + get inputs() { + return this._inputs; + } + + get outputs() { + return this._outputs; + } + + get attributes() { + return this._attributes; + } +}; + +mlir.Attribute = class { + + constructor(name, value) { + this._name = name; + this._type = 'string'; + this._value = value; + this._visible = true; + } + + get name() { + return this._name; + } + + get type() { + return this._type; + } + + get value() { + return this._value; + } + + get visible() { + return this._visible == false ? false : true; + } +}; + +mlir.Tensor = class { + + constructor(type, data) { + this._type = type; // mlir.TensorType + this._data = data; + } + + get type() { + return this._type; + } + + get quantization() { + // TODO + return null; + } + + get layout() { + switch (this._type.dataType) { + case 'float32': return '|'; + default: return '<'; + } + } + + get values() { + return this._data; + } +}; + +mlir.TensorType = class { + + constructor(dataType, shape) { + this._dataType = mlir.Utility.dataType(dataType); // string + this._shape = shape || new mlir.TensorShape([]); // mlir.TensorShape + } + + get dataType() { + return this._dataType; + } + + get shape() { + return this._shape; + } + + toString() { + return this.dataType + this._shape.toString(); + } +}; + +mlir.TensorShape = class { + + constructor(dimensions) { + this._dimensions = dimensions; + } + + get dimensions() { + return this._dimensions; + } + + toString() { + if (!this._dimensions || this._dimensions.length == 0) { + return ''; + } + return '[' + this._dimensions.map((dimension) => dimension.toString()).join(',') + ']'; + } +}; + +mlir.TokenType = { + IDENTIFIER: 'IDENTIFIER', + BOOLEAN_LITERAL: 'BOOLEAN_LITERAL', + INTEGER_LITERAL: 'INTEGER_LITERAL', + HEXADECIMAL_LITERAL: 'HEXADECIMAL_LITERAL', + FLOAT_LITERAL: 'FLOAT_LITERAL', + STRING_LITERAL: 'STRING_LITERAL', + SYMBOL_REF_ID: 'SYMBOL_REF_ID', + TYPE: 'TYPE', + DENSE: 'DENSE', + VALUE_ID: '%', + CARET_ID: '^', + COLON: ':', + COMMA: ',', + EQUAL: '=', + LPAREN: '(', + RPAREN: ')', + ARROW: '->', + LBRACKET: '[', + RBRACKET: ']', + LBRACE: '{', + RBRACE: '}', + LESS_THAN: '<', + GREATER_THAN: '>', + KEYWORD: 'KEYWORD', + EOF: 'EOF', +}; + +mlir.Token = class { + + constructor(type, value) { + this.type = type; + this.value = value; + } +}; + mlir.Tokenizer = class { constructor(decoder) { this._decoder = decoder; + this._current = this._decoder.decode(); + this._next = this._decoder.decode(); + } + + next() { + while (this._current) { + if (this._current === ' ' || this._current === '\t' || this._current === '\n' || this._current === '\r' || this._current === '\f') { + this._skipWhitespace(); + continue; + } + if (this._current === '/') { + this._skipComment(); + continue; + } + if (/[0-9]/.test(this._current)) { + let result = ''; + const type = mlir.TokenType.INTEGER_LITERAL; + while (this._current && /[0-9]/.test(this._current)) { + result += this._read(); + } + if (this._current === 'x') { + // Read the rest of the shape + do { + result += this._read(); + } while (this._current && /[0-9x]/.test(this._current)); + return new mlir.Token(mlir.TokenType.SHAPE, result); + } + return new mlir.Token(type, parseInt(result, 10)); + } + if (this._current === '.') { + if (/[0-9]/.test(this._peek())) { + return this._number(); + } + return new mlir.Token(mlir.TokenType.KEYWORD, '.'); + } + if (this._current === '-') { + if (/[0-9]/.test(this._peek())) { + return this._number(); + } else if (this._peek() === '>') { + this._read(); + this._read(); + return new mlir.Token(mlir.TokenType.ARROW, '->'); + } + this._read(); + return new mlir.Token(mlir.TokenType.KEYWORD, '-'); + } + if (this._current === '+') { + if (/[0-9]/.test(this._peek())) { + return this._number(); + } + this._read(); + return new mlir.Token(mlir.TokenType.KEYWORD, '+'); + } + if (this._current === '"') { + return this._stringLiteral(); + } + if (/[a-zA-Z_$]/.test(this._current) || /[-.]/.test(this._current)) { + return this._identifier(); + } + if (this._current === '@') { + return this._symbolRefId(); + } + if (this._current === '%') { + return this._valueId(); + } + if (this._current === '^') { + return this._caretId(); + } + if (this._current === '=') { + if (this._peek() === '=') { + this._read(); + this._read(); + return new mlir.Token(mlir.TokenType.EQUAL_EQUAL, '=='); + } + this._read(); + return new mlir.Token(mlir.TokenType.EQUAL, '='); + + } + if (this._current === ':') { + if (this._peek() === ':') { + this._read(); + this._read(); + return new mlir.Token(mlir.TokenType.DOUBLE_COLON, '::'); + } + this._read(); + return new mlir.Token(mlir.TokenType.COLON, ':'); + } + if (this._current === ',') { + this._read(); + return new mlir.Token(mlir.TokenType.COMMA, ','); + } + if (this._current === '(') { + this._read(); + return new mlir.Token(mlir.TokenType.LPAREN, '('); + } + if (this._current === ')') { + this._read(); + return new mlir.Token(mlir.TokenType.RPAREN, ')'); + } + if (this._current === '{') { + this._read(); + return new mlir.Token(mlir.TokenType.LBRACE, '{'); + } + if (this._current === '}') { + this._read(); + return new mlir.Token(mlir.TokenType.RBRACE, '}'); + } + if (this._current === '[') { + this._read(); + return new mlir.Token(mlir.TokenType.LBRACKET, '['); + } + if (this._current === ']') { + this._read(); + return new mlir.Token(mlir.TokenType.RBRACKET, ']'); + } + if (this._current === '<') { + this._read(); + return new mlir.Token(mlir.TokenType.LESS_THAN, '<'); + } + if (this._current === '>') { + this._read(); + return new mlir.Token(mlir.TokenType.GREATER_THAN, '>'); + } + const result = this._read(); + return new mlir.Token(mlir.TokenType.KEYWORD, result); + } + return new mlir.Token(mlir.TokenType.EOF, null); + } + + _read() { + const value = this._current; + this._current = this._next; + this._next = this._decoder.decode(); + return value; + } + + _peek() { + return this._next; + } + + _skipWhitespace() { + while (this._current === ' ' || this._current === '\t' || this._current === '\n' || this._current === '\r' || this._current === '\f') { + this._read(); + } + } + + _skipComment() { + if (this._current === '/') { + this._read(); + if (this._current === '/') { + while (this._current && this._current !== '\n') { + this._read(); + } + this._skipWhitespace(); + this._skipComment(); + } else if (this._current === '*') { + while (this._current) { + this._read(); + if (this._current === '*') { + this._read(); + if (this._current === '/') { + this._read(); + break; + } + } + } + this._skipWhitespace(); + this._skipComment(); + } + } + } + + _number() { + let result = ''; + let type = mlir.TokenType.INTEGER_LITERAL; + while (this._current && /[0-9]/.test(this._current)) { + result += this._read(); + } + if (this._current === 'x') { + result += this._read(); + type = mlir.TokenType.HEXADECIMAL_LITERAL; + while (this._current && /[0-9a-fA-F]/.test(this._current)) { + result += this._read(); + } + } else if (this._current === '.') { + result += this._read(); + type = mlir.TokenType.FLOAT_LITERAL; + while (this._current && /[0-9]/.test(this._current)) { + result += this._read(); + } + if (this._current === 'e' || this._current === 'E') { + result += this._read(); + if (this._current === '+' || this._current === '-') { + result += this._read(); + } + while (this._current && /[0-9]/.test(this._current)) { + result += this._read(); + } + if (type === mlir.TokenType.INTEGER_LITERAL && /[.eE]/.test(this._current)) { + type = mlir.TokenType.FLOAT_LITERAL; + } + if (type === mlir.TokenType.FLOAT_LITERAL && !/[.eE]/.test(this._current)) { + return new mlir.Token(type, parseFloat(result)); + } + if (type === mlir.TokenType.HEXADECIMAL_LITERAL && !/[x]/.test(this._current)) { + return new mlir.Token(type, parseInt(result, 16)); + } + return new mlir.Token(type, result); + } + } + + return new mlir.Token(type, parseInt(result, 10)); + } + + _stringLiteral() { + let result = ''; + this._read(); + while (this._current && this._current !== '"') { + if (this._current === '\\') { + this._read(); + switch (this._current) { + case 'n': + result += '\n'; + break; + case 'r': + result += '\r'; + break; + case 't': + result += '\t'; + break; + default: + result += this._current; + break; + } + } else { + result += this._current; + } + this._read(); + } + if (this._current === '"') { + this._read(); + return new mlir.Token(mlir.TokenType.STRING_LITERAL, result); + } + throw new Error('Unterminated string literal'); + } + + _identifier() { + let result = ''; + let opened = 0; + let wasOpened = false; + while (this._current) { + if (!opened) { + if (this._current && + (/[a-zA-Z_$<>\-.*]/.test(this._current) || + /[0-9]/.test(this._current))) { + if (this._current === '<') { + opened += 1; + wasOpened = true; + } + result += this._read(); + } else { + break; + } + } else if (!this._current) { + break; + } else if (this._current === '>') { + result += this._read(); + opened -= 1; + if (opened === 0) { + break; + } + } else { + if (this._current === '<') { + opened += 1; + } + result += this._read(); + } + } + + if (wasOpened) { + if (result.startsWith('dense')) { + return new mlir.Token(mlir.TokenType.DENSE, result); + } + return new mlir.Token(mlir.TokenType.TYPE, result); + + } + + if (result.endsWith('func')) { + return new mlir.Token(mlir.TokenType.KEYWORD, result); + } + + switch (result) { + case 'module': + case 'func': + case 'loc': + return new mlir.Token(mlir.TokenType.KEYWORD, result); + case 'true': + case 'false': + return new mlir.Token(mlir.TokenType.BOOLEAN_LITERAL, result === 'true'); + default: + return new mlir.Token(mlir.TokenType.IDENTIFIER, result); + } + } + + + _symbolRefId() { + let result = '@'; + this._read(); + if (this._current === '"') { + result += this._stringLiteral().value; + } else { + while ( + this._current && + (/[a-zA-Z_$]/.test(this._current) || + /[0-9]/.test(this._current) || + /[-.]/.test(this._current)) + ) { + result += this._read(); + } + if (this._current === ':' && this._peek() === ':') { + result += this._read(); + result += this._read(); + result += this._symbolRefId().value; + } + } + return new mlir.Token(mlir.TokenType.SYMBOL_REF_ID, result); + } + + _valueId() { + let result = ''; + if (this._current === '%') { + result = '%'; + } else if (this._current === '$') { + result = '$'; + } + this._read(); + while (this._current) { + if (/[a-zA-Z_$]/.test(this._current) || /[0-9]/.test(this._current) || /[-.#]/.test(this._current)) { + result += this._read(); + } else if (/[:]/.test(this._current) && /[0-9]/.test(this._next)) { // %myid:3 case + result += this._read(); + } else { + break; + } + } + return new mlir.Token(mlir.TokenType.VALUE_ID, result); + } + + _caretId() { + let result = '^'; + this._read(); + if (this._current === ':' && this._peek() !== ':') { + result += this._read(); + return new mlir.Token(mlir.TokenType.CARET_ID, result); + } + while (this._current && (/[a-zA-Z_$]/.test(this._current) || /[0-9]/.test(this._current) || /[-.]/.test(this._current))) { + result += this._read(); + } + if (this._current === ':' && this._peek() === ':') { + result += this._read(); + result += this._read(); + result += this._caretId().value; + } + return new mlir.Token(mlir.TokenType.CARET_ID, result); } }; @@ -58,10 +871,518 @@ mlir.Parser = class { constructor(decoder) { this._tokenizer = new mlir.Tokenizer(decoder); + this._current = this._tokenizer.next(); + this._next = this._tokenizer.next(); } read() { - throw new mlir.Error('MLIR support is not implemented.'); + const hasModule = this._current.type === mlir.TokenType.KEYWORD && this._current.value === 'module'; + let attributes = {}; + if (hasModule) { + this._eat(mlir.TokenType.KEYWORD, 'module'); + // Attributes + if (this._current.value === 'attributes') { + this._eat(mlir.TokenType.IDENTIFIER, 'attributes'); + attributes = Object.assign(attributes, this._parseAttribute()); + } + this._eat(mlir.TokenType.LBRACE); + } + const graph = { + functions: [], + operations: [], + attributes: attributes, + }; + // functions or operations + const terminal = hasModule ? mlir.TokenType.RBRACE : mlir.TokenType.EOF; + while (this._current.type !== terminal) { + if (this._current.type === mlir.TokenType.KEYWORD && this._current.value.endsWith('func')) { + // function + const func = this._parseFunction(); + graph.functions.push(func); + } else { + // operation + const op = this._parseOperation(); + graph.operations.push(op); + } + } + if (hasModule) { + this._eat(mlir.TokenType.RBRACE); + } + return graph; + } + + _parseFunction() { + // func keyword + this._eat(mlir.TokenType.KEYWORD); + let visibility = null; + if (this._current.type != mlir.TokenType.SYMBOL_REF_ID) { + visibility = this._current.value; + this._eat(this._current.type); + } + const name = this._parseFunctionName(); + const inputs = this._parseFunctionInputs(); + let attributes = {}; + // attributes + if (this._current.value === 'attributes') { + this._eat(mlir.TokenType.IDENTIFIER, 'attributes'); + attributes = Object.assign(attributes, this._parseAttribute()); + } + let outputs = {}; + if (this._current.type === mlir.TokenType.ARROW) { + outputs = Object.assign(outputs, this._parseFunctionOutputs()); + } + // attributes + if (this._current.value === 'attributes') { + this._eat(mlir.TokenType.IDENTIFIER, 'attributes'); + attributes = Object.assign(attributes, this._parseAttribute()); + } + this._eat(mlir.TokenType.LBRACE); + // operations + const operations = []; + while (this._current.type !== mlir.TokenType.RBRACE) { + const operation = this._parseOperation(); + operations.push(operation); + } + this._eat(mlir.TokenType.RBRACE); + return { + name: name, + inputs: inputs.map(input => input.name), + inputTypes: inputs.map(input => input.type), + outputTypes: outputs, + operations: operations, + attributes: attributes, + visibility: visibility, + }; + } + + _parseFunctionName() { + const name = this._current.value; + this._eat(mlir.TokenType.SYMBOL_REF_ID); + return name; + } + + _parseFunctionInputs() { + this._eat(mlir.TokenType.LPAREN); + const inputs = []; + while (this._current.type !== mlir.TokenType.RPAREN) { + const input = { + name: this._current.value, + }; + this._eat(mlir.TokenType.VALUE_ID); + this._eat(mlir.TokenType.COLON); + input.type = this._current.value; + if (this._current.type === mlir.TokenType.TYPE) { + this._eat(mlir.TokenType.TYPE); + } else if (this._current.type === mlir.TokenType.IDENTIFIER) { + this._eat(mlir.TokenType.IDENTIFIER); + } + // attribute + if (this._current.type === mlir.TokenType.LBRACE) { + input.attributes = this._parseAttribute(); + } + inputs.push(input); + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RPAREN); + return inputs; + } + + _parseFunctionOutputs() { + this._eat(mlir.TokenType.ARROW); + const outputs = []; + if (this._current.type === mlir.TokenType.LPAREN) { + this._eat(mlir.TokenType.LPAREN); + while (this._current.type !== mlir.TokenType.RPAREN) { + const output = { + type: this._current.value, + }; + if (this._current.type === mlir.TokenType.TYPE) { + this._eat(mlir.TokenType.TYPE); + } else if (this._current.type === mlir.TokenType.IDENTIFIER) { + this._eat(mlir.TokenType.IDENTIFIER); + } + // attribute + if (this._current.type === mlir.TokenType.LBRACE) { + output.attributes = this._parseAttribute(); + } + outputs.push(output); + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RPAREN); + } else { + const output = { + type: this._current.value, + }; + if (this._current.type === mlir.TokenType.TYPE) { + this._eat(mlir.TokenType.TYPE); + } else if (this._current.type === mlir.TokenType.IDENTIFIER) { + this._eat(mlir.TokenType.IDENTIFIER); + } + outputs.push(output); + } + return outputs; + } + + _parseOperation() { + // %3 + const outputs = this._parseReturnValues(); + // = + if (this._current.type == mlir.TokenType.EQUAL) { + this._eat(mlir.TokenType.EQUAL); + } + // "add" + const operationName = this._parseOperationName(); + if (this._current.type === mlir.TokenType.RBRACE) { + // early return + return { + outputs: outputs, + name: operationName, + }; + } + const skipSymbolBetween = (openingTokenType, closingTokenType) => { + if (this._current.type === openingTokenType) { + this._eat(openingTokenType); + let count = 1; + while (count > 0) { + if (this._current.type === openingTokenType) { + count++; + } else if (this._current.type === closingTokenType) { + count--; + } + this._eat(this._current.type); + } + } + }; + // (%a, %b) + // condition: start with `(%`, `%`, or `()` + const { inputs } = this._parseInputArguments(); + // successor-list? + // condition: start with `[`, end with `]` + if (this._current.type === mlir.TokenType.LBRACKET) { + skipSymbolBetween(mlir.TokenType.LBRACKET, mlir.TokenType.RBRACKET); // TODO + } + // dictionary-properties? + // condition: start with `<`, end with `>` + if (this._current.type === mlir.TokenType.LESS_THAN) { + skipSymbolBetween(mlir.TokenType.LESS_THAN, mlir.TokenType.GREATER_THAN); // TODO + } + // region-list? + // condition: start with `({^`, or (operation, end with `)` + if (this._current.type === mlir.TokenType.LPAREN && this._next.type === mlir.TokenType.LBRACE) { + skipSymbolBetween(mlir.TokenType.LPAREN, mlir.TokenType.RPAREN); // TODO + } + // dictionary-attribute? + // condition: start with `{`, end with `}` + let attributes = {}; + attributes = Object.assign(attributes, this._parseAttribute()); + // : (f32, tensor<1xf32>) + let inputTypes = []; + if (this._current.type === mlir.TokenType.COLON) { + this._eat(mlir.TokenType.COLON); + ({ inputTypes } = this._parseInputArgumentTypes()); + } + const outputTypes = []; + if (operationName.endsWith('constant') && this._current.type !== mlir.TokenType.ARROW) { + // constant + const result = { + name: operationName, + attributes: attributes, + // data: this._parseConstantData(), + outputs: outputs, + outputTypes: outputTypes, + isConstant: true, + }; + return result; + } + // -> f32 + if (this._current.type === mlir.TokenType.ARROW) { + this._eat(mlir.TokenType.ARROW); + outputTypes.push(...this._parseOutputType()); + } + let body = null; + if (this._current.type === mlir.TokenType.LBRACE) { + body = this._parseOperationBody(); + } + attributes = Object.assign(attributes, this._parseAttribute()); + const result = { + name: operationName, + attributes: attributes, + inputs: inputs, + inputTypes: inputTypes, + outputs: outputs, + outputTypes: outputTypes, + body: body, + }; + return result; + } + + _parseReturnValues() { + const outputs = []; + if (this._current.type === mlir.TokenType.LPAREN) { + this._eat(mlir.TokenType.LPAREN); + while (this._current.type !== mlir.TokenType.RPAREN) { + if (this._current.type === mlir.TokenType.VALUE_ID) { + outputs.push(this._current.value); + this._eat(mlir.TokenType.VALUE_ID); + } + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RPAREN); + } else if (this._current.type === mlir.TokenType.VALUE_ID) { + outputs.push(this._current.value); + this._eat(mlir.TokenType.VALUE_ID); + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + while (this._current.type === mlir.TokenType.VALUE_ID) { + outputs.push(this._current.value); + this._eat(mlir.TokenType.VALUE_ID); + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + } + } + const result = []; + outputs.forEach((output) => { + if (output.split(':').length == 2) { + const [valueId, length] = output.split(':'); + for (let i = 0; i < length; i++) { + result.push(valueId + '#' + i); + } + } else { + result.push(output); + } + }); + return result; + } + + _parseOperationName() { + let value; + switch (this._current.type) { + case mlir.TokenType.STRING_LITERAL: + value = this._current.value; + this._eat(mlir.TokenType.STRING_LITERAL); + break; + case mlir.TokenType.IDENTIFIER: + value = this._current.value; + this._eat(mlir.TokenType.IDENTIFIER); + if (this._current.type === mlir.TokenType.IDENTIFIER) { + value += this._current.value; + this._eat(mlir.TokenType.IDENTIFIER); + } + break; + default: + throw new Error("Unexpected token for operation name: " + JSON.stringify(this._current) + "."); + } + return value; + } + + _parseInputArguments() { + const inputs = []; + if (this._current.type === mlir.TokenType.LPAREN) { + this._eat(mlir.TokenType.LPAREN); + } + while (this._current.type !== mlir.TokenType.RPAREN && + this._current.type !== mlir.TokenType.COLON && + this._current.type !== mlir.TokenType.ARROW && + this._current.type !== mlir.TokenType.RBRACE && + this._current.type !== mlir.TokenType.IDENTIFIER && + this._current.type !== mlir.TokenType.STRING_LITERAL) { + if (this._current.type === mlir.TokenType.VALUE_ID) { + inputs.push(this._current.value); + this._eat(mlir.TokenType.VALUE_ID); + } else if (this._current.type === mlir.TokenType.DENSE) { + inputs.push(this._current.value); + this._eat(mlir.TokenType.DENSE); + return { inputs }; + } + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + if (this._current.type === mlir.TokenType.RPAREN) { + this._eat(mlir.TokenType.RPAREN); + } + return { inputs }; + } + + _parseInputArgumentTypes() { + const inputTypes = []; + if (this._current.type === mlir.TokenType.LPAREN) { + this._eat(mlir.TokenType.LPAREN); + } + while (this._current.type === mlir.TokenType.TYPE || (this._current.type === mlir.TokenType.IDENTIFIER && this._current.value === 'none')) { + inputTypes.push(this._current.value); + this._eat(this._current.type); + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + if (this._current.type === mlir.TokenType.RPAREN) { + this._eat(mlir.TokenType.RPAREN); + } + return { inputTypes }; + } + + _parseOutputArguments() { + const outputs = []; + const outputTypes = []; + this._eat(mlir.TokenType.LPAREN); + while (this._current.type !== mlir.TokenType.RPAREN) { + if (this._current.type === mlir.TokenType.VALUE_ID) { + outputs.push(this._current.value); + this._eat(mlir.TokenType.VALUE_ID); + } + if (this._current.type === mlir.TokenType.COLON) { + this._eat(mlir.TokenType.COLON); + outputTypes.push(this._current.value); + this._eat(mlir.TokenType.TYPE); + } + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RPAREN); + return { outputs, outputTypes }; + } + + _parseOutputType() { + const outputTypes = []; + if (this._current.type === mlir.TokenType.LPAREN) { + this._eat(mlir.TokenType.LPAREN); + while (this._current.type !== mlir.TokenType.RPAREN) { + outputTypes.push(this._current.value); + if (this._current.type === mlir.TokenType.TYPE) { + this._eat(mlir.TokenType.TYPE); + } else if (this._current.type === mlir.TokenType.IDENTIFIER) { + if (this._current.value === 'none' || /[^f\\d+$]/.test(this._current.value) || /[^i\\d+$]/.test(this._current.value)) { + this._eat(mlir.TokenType.IDENTIFIER); + } + } + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RPAREN); + } else { + outputTypes.push(this._current.value); + if (this._current.type === mlir.TokenType.TYPE) { + this._eat(mlir.TokenType.TYPE); + } else if (this._current.type === mlir.TokenType.IDENTIFIER) { + if (this._current.value === 'none' || /[^f\\d+$]/.test(this._current.value) || /[^i\\d+$]/.test(this._current.value)) { + this._eat(mlir.TokenType.IDENTIFIER); + } + } + } + return outputTypes; + } + + _parseOperationBody() { + let braceCount = 0; + this._eat(mlir.TokenType.LBRACE); + braceCount++; + let content = '{ '; + while (braceCount > 0) { + if (this._current.type === mlir.TokenType.LBRACE) { + braceCount++; + } else if (this._current.type === mlir.TokenType.RBRACE) { + braceCount--; + } + if (braceCount > 0) { + content += this._current.value; + if (this._current.type === mlir.TokenType.LBRACE || this._current.type === mlir.TokenType.RBRACE) { + content += '\n'; + } else if (this._current.type !== mlir.TokenType.WHITESPACE) { + content += ' '; + } + } + this._eat(this._current.type); + } + content += '}'; + return content; + } + + _parseAttribute() { + const attributes = {}; + if (this._current.type === mlir.TokenType.LBRACE) { + this._eat(mlir.TokenType.LBRACE); + while (this._current.type !== mlir.TokenType.RBRACE) { + if (this._current.type !== mlir.TokenType.IDENTIFIER) { + throw new Error("Unexpected token '" + this._current.value + "' when parsing operation attribute."); + } + const name = this._current.value; + this._eat(mlir.TokenType.IDENTIFIER); + if (this._current.type === mlir.TokenType.EQUAL) { + this._eat(mlir.TokenType.EQUAL); + const value = this._parseAttributeValue(); + attributes[name] = value; + } else { + attributes[name] = name; + } + if (this._current.type === mlir.TokenType.COMMA) { + this._eat(mlir.TokenType.COMMA); + } + } + this._eat(mlir.TokenType.RBRACE); + } + return attributes; + } + + _parseAttributeValue() { + let value = ''; + let openingCount = 0; + while (!(openingCount === 0 && (this._current.type === mlir.TokenType.COMMA || this._current.type === mlir.TokenType.RBRACE))) { + switch (this._current.type) { + case mlir.TokenType.LBRACKET: + case mlir.TokenType.LBRACE: + case mlir.TokenType.LPAREN: + openingCount++; + break; + case mlir.TokenType.RBRACKET: + case mlir.TokenType.RBRACE: + case mlir.TokenType.RPAREN: + openingCount--; + break; + default: + break; + } + value += this._current.value + ' '; + this._eat(this._current.type); + } + return value.trim(); + } + + _eat(type, value) { + if (this._current.type !== type) { + throw new Error("Expected token of type '" + type + "', but got '" + this._current.type + "'."); + } + if (value && this._current.value !== value) { + throw new Error("Expected token with value '" + value + "', but got '" + this._current.value + "'."); + } + this._current = this._next; + this._next = this._tokenizer.next(); + } +}; + +mlir.Utility = class { + + static dataType(value) { + switch (value) { + case 'f16': return 'float16'; + case 'f32': return 'float32'; + case 'f64': return 'float64'; + case 'i16': return 'int16'; + case 'i32': return 'int32'; + case 'i64': return 'int64'; + case 'i1': return 'boolean'; + default: throw new mlir.Error("Unknown data type '" + value + "'."); + } } }; diff --git a/test/models.json b/test/models.json index 4c3fb8e0b2..4518ce8987 100644 --- a/test/models.json +++ b/test/models.json @@ -2776,14 +2776,14 @@ "type": "mlir", "target": "examples.mnist_xla.mlir", "source": "https://github.com/lutzroeder/netron/files/10672271/examples.mnist_xla.mlir.zip[examples.mnist_xla.mlir]", - "error": "MLIR support is not implemented.", + "format": "MLIR", "link": "https://github.com/lutzroeder/netron/issues/1044" }, { "type": "mlir", "target": "issue_1043.mlir", "source": "https://github.com/lutzroeder/netron/files/10672270/issue_1043.mlir.zip[issue_1043.mlir]", - "error": "MLIR support is not implemented.", + "format": "MLIR", "link": "https://github.com/lutzroeder/netron/issues/1044" }, {