import Logger from "js-logger"; import { reinterpret_f32_as_i32 } from "../primitive_conversion"; import { AssemblyLexer, CodeSectionToken, DataSectionToken, IdentToken, IntToken, LabelToken, RegisterToken, StringSectionToken, StringToken, Token, TokenType, } from "./AssemblyLexer"; import { Arg, DataSegment, Instruction, InstructionSegment, Segment, SegmentType, StringSegment, } from "./instructions"; import { Kind, Opcode, OPCODES_BY_MNEMONIC, Param, StackInteraction } from "./opcodes"; const logger = Logger.get("scripting/assembly"); export type AssemblyWarning = { line_no: number; col: number; length: number; message: string; }; export type AssemblyError = AssemblyWarning; export function assemble( assembly: string[], manual_stack: boolean = false ): { object_code: Segment[]; warnings: AssemblyWarning[]; errors: AssemblyError[]; } { return new Assembler(assembly, manual_stack).assemble(); } class Assembler { private lexer = new AssemblyLexer(); private line_no!: number; private tokens!: Token[]; private object_code!: Segment[]; // The current segment. private segment?: Segment; private warnings!: AssemblyWarning[]; private errors!: AssemblyError[]; // Encountered labels. private labels!: Set; private section!: SegmentType; private first_section_marker = true; constructor(private assembly: string[], private manual_stack: boolean) {} assemble(): { object_code: Segment[]; warnings: AssemblyWarning[]; errors: AssemblyError[]; } { this.line_no = 1; this.object_code = []; this.warnings = []; this.errors = []; this.labels = new Set(); // Need to cast SegmentType.Instructions because of TypeScript bug. this.section = SegmentType.Instructions as SegmentType; this.first_section_marker = true; for (const line of this.assembly) { this.tokens = this.lexer.tokenize_line(line); if (this.tokens.length > 0) { const token = this.tokens.shift()!; switch (token.type) { case TokenType.Label: this.parse_label(token); break; case TokenType.CodeSection: case TokenType.DataSection: case TokenType.StringSection: this.parse_section(token); break; case TokenType.Int: if (this.section === SegmentType.Data) { this.parse_bytes(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.String: if (this.section === SegmentType.String) { this.parse_string(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.Ident: if (this.section === SegmentType.Instructions) { this.parse_instruction(token); } else { this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); } break; case TokenType.InvalidSection: this.add_error({ col: token.col, length: token.len, message: "Invalid section type.", }); break; case TokenType.InvalidIdent: this.add_error({ col: token.col, length: token.len, message: "Invalid identifier.", }); break; default: this.add_error({ col: token.col, length: token.len, message: "Unexpected token.", }); break; } } this.line_no++; } return { object_code: this.object_code, warnings: this.warnings, errors: this.errors, }; } private add_instruction(opcode: Opcode, args: Arg[]): void { if (!this.segment) { // Unreachable code, technically valid. const instruction_segment: InstructionSegment = { labels: [], type: SegmentType.Instructions, instructions: [], }; this.segment = instruction_segment; this.object_code.push(instruction_segment); } else if (this.segment.type === SegmentType.Instructions) { this.segment.instructions.push(new Instruction(opcode, args)); } else { logger.error(`Line ${this.line_no}: Expected instructions segment.`); } } private add_bytes(bytes: number[]): void { if (!this.segment) { // Unadressable data, technically valid. const data_segment: DataSegment = { labels: [], type: SegmentType.Data, data: new Uint8Array(bytes).buffer, }; this.segment = data_segment; this.object_code.push(data_segment); } else if (this.segment.type === SegmentType.Data) { const buf = new ArrayBuffer(this.segment.data.byteLength + bytes.length); const arr = new Uint8Array(buf); arr.set(new Uint8Array(this.segment.data)); arr.set(new Uint8Array(bytes), this.segment.data.byteLength); this.segment.data = buf; } else { logger.error(`Line ${this.line_no}: Expected data segment.`); } } private add_string(str: string): void { if (!this.segment) { // Unadressable data, technically valid. const string_segment: StringSegment = { labels: [], type: SegmentType.String, value: str, }; this.segment = string_segment; this.object_code.push(string_segment); } else if (this.segment.type === SegmentType.String) { this.segment.value += str; } else { logger.error(`Line ${this.line_no}: Expected string segment.`); } } private add_error({ col, length, message, }: { col: number; length: number; message: string; }): void { this.errors.push({ line_no: this.line_no, col, length, message, }); } private add_warning({ col, length, message, }: { col: number; length: number; message: string; }): void { this.warnings.push({ line_no: this.line_no, col, length, message, }); } private parse_label({ col, len, value: label }: LabelToken): void { if (this.labels.has(label)) { this.add_error({ col, length: len, message: "Duplicate label.", }); } this.labels.add(label); const next_token = this.tokens.shift(); switch (this.section) { case SegmentType.Instructions: this.segment = { type: SegmentType.Instructions, labels: [label], instructions: [], }; this.object_code.push(this.segment); if (next_token) { if (next_token.type === TokenType.Ident) { this.parse_instruction(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected opcode mnemonic.", }); } } break; case SegmentType.Data: this.segment = { type: SegmentType.Data, labels: [label], data: new ArrayBuffer(0), }; this.object_code.push(this.segment); if (next_token) { if (next_token.type === TokenType.Int) { this.parse_bytes(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected bytes.", }); } } break; case SegmentType.String: this.segment = { type: SegmentType.String, labels: [label], value: "", }; this.object_code.push(this.segment); if (next_token) { if (next_token.type === TokenType.String) { this.parse_string(next_token); } else { this.add_error({ col: next_token.col, length: next_token.len, message: "Expected a string.", }); } } break; } } private parse_section({ type, col, len, }: CodeSectionToken | DataSectionToken | StringSectionToken): void { let section!: SegmentType; switch (type) { case TokenType.CodeSection: section = SegmentType.Instructions; break; case TokenType.DataSection: section = SegmentType.Data; break; case TokenType.StringSection: section = SegmentType.String; break; } if (this.section === section && !this.first_section_marker) { this.add_warning({ col, length: len, message: "Unnecessary section marker.", }); } this.section = section; this.first_section_marker = false; const next_token = this.tokens.shift(); if (next_token) { this.add_error({ col: next_token.col, length: next_token.len, message: "Unexpected token.", }); } } private parse_instruction({ col, len, value }: IdentToken): void { const opcode = OPCODES_BY_MNEMONIC.get(value); if (!opcode) { this.add_error({ col, length: len, message: "Unknown instruction.", }); } else { const varargs = opcode.params.findIndex( p => p.type.kind === Kind.ILabelVar || p.type.kind === Kind.RegRefVar ) !== -1; const param_count = this.manual_stack && opcode.stack === StackInteraction.Pop ? 0 : opcode.params.length; let arg_count = 0; for (const token of this.tokens) { if (token.type !== TokenType.ArgSeperator) { arg_count++; } } const last_token = this.tokens[this.tokens.length - 1]; let error_length = last_token ? last_token.col + last_token.len - col : 0; const ins_args: [Arg, Token][] = []; if (!varargs && arg_count !== param_count) { this.add_error({ col, length: error_length, message: `Expected ${param_count} argument${ param_count === 1 ? "" : "s" }, got ${arg_count}.`, }); return; } else if (varargs && arg_count < param_count) { this.add_error({ col, length: error_length, message: `Expected at least ${param_count} argument${ param_count === 1 ? "" : "s" }, got ${arg_count}.`, }); return; } else if (opcode.stack !== StackInteraction.Pop) { // Inline arguments. if (!this.parse_args(opcode.params, ins_args, false)) { return; } } else { // Stack arguments. const stack_args: [Arg, Token][] = []; if (!this.parse_args(opcode.params, stack_args, true)) { return; } for (let i = 0; i < opcode.params.length; i++) { const param = opcode.params[i]; const arg_and_token = stack_args[i]; if (arg_and_token == undefined) { continue; } const [arg, token] = arg_and_token; if (token.type === TokenType.Register) { if (param.type.kind === Kind.RegTupRef) { this.add_instruction(Opcode.ARG_PUSHB, [arg]); } else { this.add_instruction(Opcode.ARG_PUSHR, [arg]); } } else { switch (param.type.kind) { case Kind.Byte: case Kind.RegRef: case Kind.RegTupRef: this.add_instruction(Opcode.ARG_PUSHB, [arg]); break; case Kind.Word: case Kind.Label: case Kind.ILabel: case Kind.DLabel: case Kind.SLabel: this.add_instruction(Opcode.ARG_PUSHW, [arg]); break; case Kind.DWord: this.add_instruction(Opcode.ARG_PUSHL, [arg]); break; case Kind.Float: this.add_instruction(Opcode.ARG_PUSHL, [ { value: reinterpret_f32_as_i32(arg.value), size: 4, }, ]); break; case Kind.String: this.add_instruction(Opcode.ARG_PUSHS, [arg]); break; default: logger.error( `Line ${this.line_no}: Type ${ Kind[param.type.kind] } not implemented.` ); break; } } } } this.add_instruction(opcode, ins_args.map(([arg]) => arg)); } } /** * @returns true if arguments can be translated to object code, possibly after truncation. False otherwise. */ private parse_args(params: Param[], arg_and_tokens: [Arg, Token][], stack: boolean): boolean { let semi_valid = true; let should_be_arg = true; let param_i = 0; for (let i = 0; i < this.tokens.length; i++) { const token = this.tokens[i]; const param = params[param_i]; if (token.type === TokenType.ArgSeperator) { if (should_be_arg) { this.add_error({ col: token.col, length: token.len, message: "Expected an argument.", }); } else { if (param.type.kind !== Kind.ILabelVar && param.type.kind !== Kind.RegRefVar) { param_i++; } } should_be_arg = true; } else { if (!should_be_arg) { const prev_token = this.tokens[i - 1]; const col = prev_token.col + prev_token.len; this.add_error({ col, length: token.col - col, message: "Expected a comma.", }); } should_be_arg = false; let match: boolean; switch (token.type) { case TokenType.Int: switch (param.type.kind) { case Kind.Byte: match = true; this.parse_int(1, token, arg_and_tokens); break; case Kind.Word: case Kind.Label: case Kind.ILabel: case Kind.DLabel: case Kind.SLabel: case Kind.ILabelVar: match = true; this.parse_int(2, token, arg_and_tokens); break; case Kind.DWord: match = true; this.parse_int(4, token, arg_and_tokens); break; case Kind.Float: match = true; arg_and_tokens.push([ { value: token.value, size: 4, }, token, ]); break; default: match = false; break; } break; case TokenType.Float: match = param.type.kind === Kind.Float; if (match) { arg_and_tokens.push([ { value: token.value, size: 4, }, token, ]); } break; case TokenType.Register: match = stack || param.type.kind === Kind.RegRef || param.type.kind === Kind.RegRefVar || param.type.kind === Kind.RegTupRef; this.parse_register(token, arg_and_tokens); break; case TokenType.String: match = param.type.kind === Kind.String; if (match) { arg_and_tokens.push([ { value: token.value, size: 2 * token.value.length + 2, }, token, ]); } break; default: match = false; break; } if (!match) { semi_valid = false; let type_str: string | undefined; switch (param.type.kind) { case Kind.Byte: type_str = "a 8-bit integer"; break; case Kind.Word: type_str = "a 16-bit integer"; break; case Kind.DWord: type_str = "a 32-bit integer"; break; case Kind.Float: type_str = "a float"; break; case Kind.Label: type_str = "a label"; break; case Kind.ILabel: case Kind.ILabelVar: type_str = "an instruction label"; break; case Kind.DLabel: type_str = "a data label"; break; case Kind.SLabel: type_str = "a string label"; break; case Kind.String: type_str = "a string"; break; case Kind.RegRef: case Kind.RegRefVar: case Kind.RegTupRef: type_str = "a register reference"; break; } if (type_str) { this.add_error({ col: token.col, length: token.len, message: `Expected ${type_str}.`, }); } else { this.add_error({ col: token.col, length: token.len, message: `Unexpected token.`, }); } } } } this.tokens = []; return semi_valid; } private parse_int(size: number, token: IntToken, arg_and_tokens: [Arg, Token][]): void { const { value, col, len } = token; const bit_size = 8 * size; const min_value = -Math.pow(2, bit_size - 1); const max_value = Math.pow(2, bit_size) - 1; if (value < min_value) { this.add_error({ col, length: len, message: `${bit_size}-Bit integer can't be less than ${min_value}.`, }); } else if (value > max_value) { this.add_error({ col, length: len, message: `${bit_size}-Bit integer can't be greater than ${max_value}.`, }); } else { arg_and_tokens.push([ { value, size, }, token, ]); } } private parse_register(token: RegisterToken, arg_and_tokens: [Arg, Token][]): void { const { col, len, value } = token; if (value > 255) { this.add_error({ col, length: len, message: `Invalid register reference, expected r0-r255.`, }); } else { arg_and_tokens.push([ { value, size: 1, }, token, ]); } } private parse_bytes(first_token: IntToken): void { const bytes = []; let token: Token = first_token; let i = 0; while (token.type === TokenType.Int) { if (token.value < 0) { this.add_error({ col: token.col, length: token.len, message: "Unsigned 8-bit integer can't be less than 0.", }); } else if (token.value > 255) { this.add_error({ col: token.col, length: token.len, message: "Unsigned 8-bit integer can't be greater than 255.", }); } bytes.push(token.value); if (i < this.tokens.length) { token = this.tokens[i++]; } else { break; } } if (i < this.tokens.length) { this.add_error({ col: token.col, length: token.len, message: "Expected an unsigned 8-bit integer.", }); } this.add_bytes(bytes); } private parse_string(token: StringToken): void { const next_token = this.tokens.shift(); if (next_token) { this.add_error({ col: next_token.col, length: next_token.len, message: "Unexpected token.", }); } this.add_string(token.value); } }