import { reinterpret_f32_as_i32 } from "../../core/primitive_conversion"; import { AssemblyLexer, CodeSectionToken, DataSectionToken, IdentToken, IntToken, LabelToken, RegisterToken, StringSectionToken, StringToken, Token, TokenType, } from "./AssemblyLexer"; import { Arg, DataSegment, InstructionSegment, new_instruction, Segment, SegmentType, StringSegment, } from "../../core/data_formats/asm/instructions"; import { Kind, OP_ARG_PUSHB, OP_ARG_PUSHL, OP_ARG_PUSHR, OP_ARG_PUSHS, OP_ARG_PUSHW, Opcode, OPCODES_BY_MNEMONIC, Param, StackInteraction, } from "../../core/data_formats/asm/opcodes"; import { LogManager } from "../../core/logging"; const logger = LogManager.get("quest_editor/scripting/assembly"); export type AssemblyWarning = { line_no: number; col: number; length: number; message: string; }; export type AssemblyError = AssemblyWarning; export type AssemblySettings = { manual_stack: boolean; }; export function assemble( assembly: string[], manual_stack = false, ): { object_code: Segment[]; warnings: AssemblyWarning[]; errors: AssemblyError[]; } { logger.trace("assemble start"); const result = new Assembler(assembly, manual_stack).assemble(); logger.trace( `assemble end with ${result.warnings.length} warnings and ${result.errors.length} errors.`, ); return result; } class Assembler { private readonly lexer = new AssemblyLexer(); private line_no!: number; private tokens!: Token[]; private object_code!: Segment[]; /** * The current segment. */ private segment?: Segment; private warnings!: AssemblyWarning[]; private errors!: AssemblyError[]; /** * Encountered labels. */ private labels!: Set; private section: SegmentType = SegmentType.Instructions; private first_section_marker = true; private prev_line_had_label = false; constructor(private readonly assembly: string[], private readonly manual_stack: boolean) {} assemble(): { object_code: Segment[]; warnings: AssemblyWarning[]; errors: AssemblyError[]; } { // Reset all state. this.line_no = 1; this.object_code = []; this.warnings = []; this.errors = []; this.labels = new Set(); // Need to cast SegmentType.Instructions because of TypeScript bug. this.section = SegmentType.Instructions as SegmentType; this.first_section_marker = true; this.prev_line_had_label = false; // Tokenize and assemble line by line. for (const line of this.assembly) { this.tokens = this.lexer.tokenize_line(line); if (this.tokens.length > 0) { const token = this.tokens.shift()!; let has_label = false; switch (token.type) { case TokenType.Label: this.parse_label(token); has_label = true; break; case TokenType.CodeSection: case TokenType.DataSection: case TokenType.StringSection: this.parse_section(token); break; case TokenType.Int: if (this.section === SegmentType.Data) { this.parse_bytes(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.String: if (this.section === SegmentType.String) { this.parse_string(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.Ident: if (this.section === SegmentType.Instructions) { this.parse_instruction(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.InvalidSection: this.add_error({ col: token.col, length: token.len, message: "Invalid section type.", }); break; case TokenType.InvalidIdent: this.add_error({ col: token.col, length: token.len, message: "Invalid identifier.", }); break; default: this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); break; } this.prev_line_had_label = has_label; } this.line_no++; } return { object_code: this.object_code, warnings: this.warnings, errors: this.errors, }; } private add_instruction( opcode: Opcode, args: Arg[], stack_args: Arg[], token: Token | undefined, arg_tokens: Token[], stack_arg_tokens: Token[], ): void { if (!this.segment) { // Unreachable code, technically valid. const instruction_segment: InstructionSegment = { labels: [], type: SegmentType.Instructions, instructions: [], asm: { labels: [], }, }; this.segment = instruction_segment; this.object_code.push(instruction_segment); } else if (this.segment.type === SegmentType.Instructions) { this.segment.instructions.push( new_instruction(opcode, args, { mnemonic: token && { line_no: this.line_no, col: token.col, len: token.len, }, args: arg_tokens.map(arg_t => ({ line_no: this.line_no, col: arg_t.col, len: arg_t.len, })), stack_args: stack_arg_tokens.map((arg_t, i) => ({ line_no: this.line_no, col: arg_t.col, len: arg_t.len, value: stack_args[i].value, })), }), ); } else { logger.error(`Line ${this.line_no}: Expected instructions segment.`); } } private add_bytes(bytes: number[]): void { if (!this.segment) { // Unaddressable data, technically valid. const data_segment: DataSegment = { labels: [], type: SegmentType.Data, data: new Uint8Array(bytes).buffer, asm: { labels: [], }, }; this.segment = data_segment; this.object_code.push(data_segment); } else if (this.segment.type === SegmentType.Data) { const buf = new ArrayBuffer(this.segment.data.byteLength + bytes.length); const arr = new Uint8Array(buf); arr.set(new Uint8Array(this.segment.data)); arr.set(new Uint8Array(bytes), this.segment.data.byteLength); this.segment.data = buf; } else { logger.error(`Line ${this.line_no}: Expected data segment.`); } } private add_string(str: string): void { if (!this.segment) { // Unaddressable data, technically valid. const string_segment: StringSegment = { labels: [], type: SegmentType.String, value: str, asm: { labels: [], }, }; this.segment = string_segment; this.object_code.push(string_segment); } else if (this.segment.type === SegmentType.String) { this.segment.value += str; } else { logger.error(`Line ${this.line_no}: Expected string segment.`); } } private add_error({ col, length, message, }: { col: number; length: number; message: string; }): void { this.errors.push({ line_no: this.line_no, col, length, message, }); } private add_warning({ col, length, message, }: { col: number; length: number; message: string; }): void { this.warnings.push({ line_no: this.line_no, col, length, message, }); } private parse_label({ col, len, value: label }: LabelToken): void { if (this.labels.has(label)) { this.add_error({ col, length: len, message: "Duplicate label.", }); } this.labels.add(label); const next_token = this.tokens.shift(); const asm = { line_no: this.line_no, col, len }; if (this.prev_line_had_label) { const segment = this.object_code[this.object_code.length - 1]; segment.labels.push(label); segment.asm.labels.push(asm); } switch (this.section) { case SegmentType.Instructions: if (!this.prev_line_had_label) { this.segment = { type: SegmentType.Instructions, labels: [label], instructions: [], asm: { labels: [asm] }, }; this.object_code.push(this.segment); } if (next_token) { if (next_token.type === TokenType.Ident) { this.parse_instruction(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected opcode mnemonic.", }); } } break; case SegmentType.Data: if (!this.prev_line_had_label) { this.segment = { type: SegmentType.Data, labels: [label], data: new ArrayBuffer(0), asm: { labels: [asm], }, }; this.object_code.push(this.segment); } if (next_token) { if (next_token.type === TokenType.Int) { this.parse_bytes(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected bytes.", }); } } break; case SegmentType.String: if (!this.prev_line_had_label) { this.segment = { type: SegmentType.String, labels: [label], value: "", asm: { labels: [asm], }, }; this.object_code.push(this.segment); } if (next_token) { if (next_token.type === TokenType.String) { this.parse_string(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected a string.", }); } } break; } } private parse_section({ type, col, len, }: CodeSectionToken | DataSectionToken | StringSectionToken): void { let section!: SegmentType; switch (type) { case TokenType.CodeSection: section = SegmentType.Instructions; break; case TokenType.DataSection: section = SegmentType.Data; break; case TokenType.StringSection: section = SegmentType.String; break; } if (this.section === section && !this.first_section_marker) { this.add_warning({ col, length: len, message: "Unnecessary section marker.", }); } this.section = section; this.first_section_marker = false; const next_token = this.tokens.shift(); if (next_token) { this.add_error({ col: next_token.col, length: next_token.len, message: "Unexpected token.", }); } } private parse_instruction(ident_token: IdentToken): void { const { col, len, value } = ident_token; const opcode = OPCODES_BY_MNEMONIC.get(value); if (!opcode) { this.add_error({ col, length: len, message: "Unknown instruction.", }); } else { const varargs = opcode.params.findIndex( p => p.type.kind === Kind.ILabelVar || p.type.kind === Kind.RegRefVar, ) !== -1; const param_count = this.manual_stack && opcode.stack === StackInteraction.Pop ? 0 : opcode.params.length; let arg_count = 0; for (const token of this.tokens) { if (token.type !== TokenType.ArgSeparator) { arg_count++; } } const last_token = this.tokens[this.tokens.length - 1]; const error_length = last_token ? last_token.col + last_token.len - col : 0; // Inline arguments. const ins_arg_and_tokens: [Arg, Token][] = []; // Stack arguments. const stack_arg_and_tokens: [Arg, Token][] = []; if (!varargs && arg_count !== param_count) { this.add_error({ col, length: error_length, message: `Expected ${param_count} argument${ param_count === 1 ? "" : "s" }, got ${arg_count}.`, }); return; } else if (varargs && arg_count < param_count) { this.add_error({ col, length: error_length, message: `Expected at least ${param_count} argument${ param_count === 1 ? "" : "s" }, got ${arg_count}.`, }); return; } else if (opcode.stack !== StackInteraction.Pop) { // Inline arguments. if (!this.parse_args(opcode.params, ins_arg_and_tokens, false)) { return; } } else { if (!this.parse_args(opcode.params, stack_arg_and_tokens, true)) { return; } for (let i = 0; i < opcode.params.length; i++) { const param = opcode.params[i]; const arg_and_token = stack_arg_and_tokens[i]; if (arg_and_token == undefined) { continue; } const [arg, arg_token] = arg_and_token; if (arg_token.type === TokenType.Register) { if (param.type.kind === Kind.RegTupRef) { this.add_instruction( OP_ARG_PUSHB, [arg], [], undefined, [arg_token], [], ); } else { this.add_instruction( OP_ARG_PUSHR, [arg], [], undefined, [arg_token], [], ); } } else { switch (param.type.kind) { case Kind.Byte: case Kind.RegRef: case Kind.RegTupRef: this.add_instruction( OP_ARG_PUSHB, [arg], [], undefined, [arg_token], [], ); break; case Kind.Word: case Kind.Label: case Kind.ILabel: case Kind.DLabel: case Kind.SLabel: this.add_instruction( OP_ARG_PUSHW, [arg], [], undefined, [arg_token], [], ); break; case Kind.DWord: this.add_instruction( OP_ARG_PUSHL, [arg], [], undefined, [arg_token], [], ); break; case Kind.Float: this.add_instruction( OP_ARG_PUSHL, [{ value: reinterpret_f32_as_i32(arg.value) }], [], undefined, [arg_token], [], ); break; case Kind.String: this.add_instruction( OP_ARG_PUSHS, [arg], [], undefined, [arg_token], [], ); break; default: logger.error( `Line ${this.line_no}: Type ${ Kind[param.type.kind] } not implemented.`, ); break; } } } } const args: Arg[] = []; const arg_tokens: Token[] = []; const stack_args: Arg[] = []; const stack_arg_tokens: Token[] = []; for (const [arg, token] of ins_arg_and_tokens) { args.push(arg); arg_tokens.push(token); } for (const [arg, token] of stack_arg_and_tokens) { stack_args.push(arg); stack_arg_tokens.push(token); } this.add_instruction( opcode, args, stack_args, ident_token, arg_tokens, stack_arg_tokens, ); } } /** * @returns true if arguments can be translated to object code, possibly after truncation. False otherwise. */ private parse_args( params: readonly Param[], arg_and_tokens: [Arg, Token][], stack: boolean, ): boolean { let semi_valid = true; let should_be_arg = true; let param_i = 0; for (let i = 0; i < this.tokens.length; i++) { const token = this.tokens[i]; const param = params[param_i]; if (token.type === TokenType.ArgSeparator) { if (should_be_arg) { this.add_error({ col: token.col, length: token.len, message: "Expected an argument.", }); } else if ( param.type.kind !== Kind.ILabelVar && param.type.kind !== Kind.RegRefVar ) { param_i++; } should_be_arg = true; } else { if (!should_be_arg) { const prev_token = this.tokens[i - 1]; const col = prev_token.col + prev_token.len; this.add_error({ col, length: token.col - col, message: "Expected a comma.", }); } should_be_arg = false; let match: boolean; switch (token.type) { case TokenType.Int: switch (param.type.kind) { case Kind.Byte: match = true; this.parse_int(1, token, arg_and_tokens); break; case Kind.Word: case Kind.Label: case Kind.ILabel: case Kind.DLabel: case Kind.SLabel: case Kind.ILabelVar: match = true; this.parse_int(2, token, arg_and_tokens); break; case Kind.DWord: match = true; this.parse_int(4, token, arg_and_tokens); break; case Kind.Float: match = true; arg_and_tokens.push([{ value: token.value }, token]); break; default: match = false; break; } break; case TokenType.Float: match = param.type.kind === Kind.Float; if (match) { arg_and_tokens.push([{ value: token.value }, token]); } break; case TokenType.Register: match = stack || param.type.kind === Kind.RegRef || param.type.kind === Kind.RegRefVar || param.type.kind === Kind.RegTupRef; this.parse_register(token, arg_and_tokens); break; case TokenType.String: match = param.type.kind === Kind.String; if (match) { arg_and_tokens.push([{ value: token.value }, token]); } break; default: match = false; break; } if (!match) { semi_valid = false; let type_str: string | undefined; switch (param.type.kind) { case Kind.Byte: type_str = "an 8-bit integer"; break; case Kind.Word: type_str = "a 16-bit integer"; break; case Kind.DWord: type_str = "a 32-bit integer"; break; case Kind.Float: type_str = "a float"; break; case Kind.Label: type_str = "a label"; break; case Kind.ILabel: case Kind.ILabelVar: type_str = "an instruction label"; break; case Kind.DLabel: type_str = "a data label"; break; case Kind.SLabel: type_str = "a string label"; break; case Kind.String: type_str = "a string"; break; case Kind.RegRef: case Kind.RegRefVar: case Kind.RegTupRef: type_str = "a register reference"; break; } if (type_str) { this.add_error({ col: token.col, length: token.len, message: `Expected ${type_str}.`, }); } else { this.add_error({ col: token.col, length: token.len, message: `Unexpected token.`, }); } } } } this.tokens = []; return semi_valid; } private parse_int(size: number, token: IntToken, arg_and_tokens: [Arg, Token][]): void { const { value, col, len } = token; const bit_size = 8 * size; const min_value = -Math.pow(2, bit_size - 1); const max_value = Math.pow(2, bit_size) - 1; if (value < min_value) { this.add_error({ col, length: len, message: `${bit_size}-Bit integer can't be less than ${min_value}.`, }); } else if (value > max_value) { this.add_error({ col, length: len, message: `${bit_size}-Bit integer can't be greater than ${max_value}.`, }); } else { arg_and_tokens.push([{ value }, token]); } } private parse_register(token: RegisterToken, arg_and_tokens: [Arg, Token][]): void { const { col, len, value } = token; if (value > 255) { this.add_error({ col, length: len, message: `Invalid register reference, expected r0-r255.`, }); } else { arg_and_tokens.push([{ value }, token]); } } private parse_bytes(first_token: IntToken): void { const bytes = []; let token: Token = first_token; let i = 0; while (token.type === TokenType.Int) { if (token.value < 0) { this.add_error({ col: token.col, length: token.len, message: "Unsigned 8-bit integer can't be less than 0.", }); } else if (token.value > 255) { this.add_error({ col: token.col, length: token.len, message: "Unsigned 8-bit integer can't be greater than 255.", }); } bytes.push(token.value); if (i < this.tokens.length) { token = this.tokens[i++]; } else { break; } } if (i < this.tokens.length) { this.add_error({ col: token.col, length: token.len, message: "Expected an unsigned 8-bit integer.", }); } this.add_bytes(bytes); } private parse_string(token: StringToken): void { const next_token = this.tokens.shift(); if (next_token) { this.add_error({ col: next_token.col, length: next_token.len, message: "Unexpected token.", }); } this.add_string(token.value.replace(/\n/g, "")); } }