From 769e6a86197cb09d23fad304e9f4ebcc3fdf2122 Mon Sep 17 00:00:00 2001 From: Daan Vanden Bosch Date: Mon, 22 Jul 2019 16:03:58 +0200 Subject: [PATCH] Added basic assembler. --- src/data_formats/parsing/quest/opcodes.ts | 30 ++- src/scripting/assembly.test.ts | 60 +++++ src/scripting/assembly.ts | 250 ++++++++++++++++++ src/{ui => }/scripting/disassembly.ts | 15 +- src/ui/quest_editor/ScriptEditorComponent.tsx | 24 +- 5 files changed, 360 insertions(+), 19 deletions(-) create mode 100644 src/scripting/assembly.test.ts create mode 100644 src/scripting/assembly.ts rename src/{ui => }/scripting/disassembly.ts (84%) diff --git a/src/data_formats/parsing/quest/opcodes.ts b/src/data_formats/parsing/quest/opcodes.ts index 5bde289e..1c3db220 100644 --- a/src/data_formats/parsing/quest/opcodes.ts +++ b/src/data_formats/parsing/quest/opcodes.ts @@ -1,24 +1,44 @@ +import { string } from "prop-types"; + /** * Instruction parameter types. */ export enum Type { + /** + * Unsigned 8-bit integer. + */ U8, + /** + * Unsigned 16-bit integer. + */ U16, + /** + * Unsigned 32-bit integer. + */ U32, + /** + * Signed 32-bit integer. + */ I32, + /** + * 32-Bit floating point number. + */ F32, /** * Register reference */ Register, /** - * Variable amount of u8 arguments. + * Arbitrary amount of u8 arguments. */ U8Var, /** - * Variable amount of u16 arguments. + * Arbitrary amount of u16 arguments. */ U16Var, + /** + * String of arbitrary size. + */ String, } @@ -4902,3 +4922,9 @@ export class Opcode { [] )); } + +export const OPCODES_BY_MNEMONIC = new Map(); + +OPCODES.forEach(opcode => { + OPCODES_BY_MNEMONIC.set(opcode.mnemonic, opcode); +}); diff --git a/src/scripting/assembly.test.ts b/src/scripting/assembly.test.ts new file mode 100644 index 00000000..73a19a98 --- /dev/null +++ b/src/scripting/assembly.test.ts @@ -0,0 +1,60 @@ +import { assemble } from "./assembly"; +import { Opcode } from "../data_formats/parsing/quest/bin"; + +test("", () => { + const { instructions, labels, errors } = assemble(` + 0: set_episode 0 + bb_map_designate 1, 2, 3, 4 + set_floor_handler 0, 150 + set_floor_handler 1, 151 + ret + 150: set_mainwarp 1 + ret + 151: ret + `); + + expect(errors).toEqual([]); + + expect(instructions.length).toBe(13); + + expect(instructions[0].opcode).toBe(Opcode.set_episode); + expect(instructions[0].args).toEqual([{ value: 0, size: 4 }]); + + expect(instructions[1].opcode).toBe(Opcode.bb_map_designate); + expect(instructions[1].args).toEqual([ + { value: 1, size: 1 }, + { value: 2, size: 2 }, + { value: 3, size: 1 }, + { value: 4, size: 1 }, + ]); + + expect(instructions[2].opcode).toBe(Opcode.arg_pushl); + expect(instructions[2].args).toEqual([{ value: 0, size: 4 }]); + expect(instructions[3].opcode).toBe(Opcode.arg_pushw); + expect(instructions[3].args).toEqual([{ value: 150, size: 2 }]); + expect(instructions[4].opcode).toBe(Opcode.set_floor_handler); + expect(instructions[4].args).toEqual([]); + + expect(instructions[5].opcode).toBe(Opcode.arg_pushl); + expect(instructions[5].args).toEqual([{ value: 1, size: 4 }]); + expect(instructions[6].opcode).toBe(Opcode.arg_pushw); + expect(instructions[6].args).toEqual([{ value: 151, size: 2 }]); + expect(instructions[7].opcode).toBe(Opcode.set_floor_handler); + expect(instructions[7].args).toEqual([]); + + expect(instructions[8].opcode).toBe(Opcode.ret); + expect(instructions[8].args).toEqual([]); + + expect(instructions[9].opcode).toBe(Opcode.arg_pushl); + expect(instructions[9].args).toEqual([{ value: 1, size: 4 }]); + expect(instructions[10].opcode).toBe(Opcode.set_mainwarp); + expect(instructions[10].args).toEqual([]); + + expect(instructions[11].opcode).toBe(Opcode.ret); + expect(instructions[11].args).toEqual([]); + + expect(instructions[12].opcode).toBe(Opcode.ret); + expect(instructions[12].args).toEqual([]); + + expect(labels).toEqual(new Map([[0, 0], [150, 9], [151, 12]])); +}); diff --git a/src/scripting/assembly.ts b/src/scripting/assembly.ts new file mode 100644 index 00000000..68216cbe --- /dev/null +++ b/src/scripting/assembly.ts @@ -0,0 +1,250 @@ +import { + Instruction, + OPCODES_BY_MNEMONIC, + Arg, + Type, + Opcode, + Param, +} from "../data_formats/parsing/quest/bin"; + +type DisassemblyError = { + line: number; + col: number; + length: number; + description: string; +}; + +export function assemble( + assembly: string, + manual_stack: boolean = false +): { + instructions: Instruction[]; + labels: Map; + errors: DisassemblyError[]; +} { + const errors: DisassemblyError[] = []; + const instructions: Instruction[] = []; + const labels = new Map(); + + let line = 1; + + for (const line_text of assembly.split("\n")) { + const match = line_text.match( + /^(?\s*)(?[^\s]+?:)?(?\s*)(?[a-z][a-z_=<>!]*)?(?.*)$/ + ); + + if (!match || !match.groups || (match.groups.lbl == null && match.groups.op == null)) { + const left_trimmed = line_text.trimLeft(); + const trimmed = left_trimmed.trimRight(); + + if (trimmed.length) { + errors.push({ + line, + col: line_text.length - left_trimmed.length, + length: trimmed.length, + description: "Expected label or instruction.", + }); + } + } else { + const { lbl_ws, lbl, op_ws, op, args } = match.groups; + + if (lbl != null) { + const label = parseInt(lbl.slice(0, -1), 10); + + if (!isFinite(label)) { + errors.push({ + line, + col: lbl_ws.length, + length: lbl.length, + description: "Invalid label name.", + }); + } else if (labels.has(label)) { + errors.push({ + line, + col: lbl_ws.length, + length: lbl.length - 1, + description: "Duplicate label.", + }); + } else { + labels.set(label, instructions.length); + } + } + + if (op != null) { + const opcode = OPCODES_BY_MNEMONIC.get(op); + + if (!opcode) { + errors.push({ + line, + col: lbl_ws.length + (lbl ? lbl.length : 0) + op_ws.length, + length: op.length, + description: "Unknown instruction.", + }); + } else { + const args_col = + lbl_ws.length + + (lbl ? lbl.length : 0) + + op_ws.length + + (op ? op.length : 0); + + const arg_tokens: ArgToken[] = []; + const args_tokenization_ok = tokenize_args(args, args_col, arg_tokens); + + const ins_args: Arg[] = []; + + if (!args_tokenization_ok) { + const left_trimmed = args.trimLeft(); + const trimmed = args.trimRight(); + + if (trimmed.trim().length) { + errors.push({ + line, + col: args_col + args.length - left_trimmed.length, + length: trimmed.length, + description: "Instruction arguments expected.", + }); + } + } else { + const param_count = + opcode.params.length + (manual_stack ? 0 : opcode.stack_params.length); + + if (arg_tokens.length !== param_count) { + const left_trimmed = line_text.trimLeft(); + const trimmed = left_trimmed.trimRight(); + errors.push({ + line, + col: line_text.length - left_trimmed.length, + length: trimmed.length, + description: `Expected ${param_count} arguments, got ${arg_tokens.length}.`, + }); + } else if (arg_tokens.length === opcode.params.length) { + parse_args(opcode.params, arg_tokens, ins_args); + } else { + const stack_args: Arg[] = []; + parse_args(opcode.stack_params, arg_tokens, stack_args); + + // TODO: proper error checking. + // TODO: UVars. + for (let i = 0; i < opcode.stack_params.length; i++) { + const param = opcode.stack_params[i]; + const arg = stack_args[i]; + + switch (param.type) { + case Type.U8: + case Type.Register: + instructions.push(new Instruction(Opcode.arg_pushb, [arg])); + break; + case Type.U16: + instructions.push(new Instruction(Opcode.arg_pushw, [arg])); + break; + case Type.U32: + case Type.I32: + case Type.F32: + instructions.push(new Instruction(Opcode.arg_pushl, [arg])); + break; + case Type.String: + instructions.push(new Instruction(Opcode.arg_pushs, [arg])); + break; + default: + throw new Error( + `Type ${Type[param.type]} not implemented yet.` + ); + } + } + } + } + + instructions.push(new Instruction(opcode, ins_args)); + } + } + } + + line++; + } + + return { + instructions, + labels, + errors, + }; +} + +type ArgToken = { + col: number; + arg: string; +}; + +function tokenize_args(arg_str: string, col: number, args: ArgToken[]): boolean { + if (arg_str.length === 0) { + return true; + } + + let match: RegExpMatchArray | null; + + if (args.length === 0) { + match = arg_str.match(/^(?\s+)(?"([^"\\]|\\.)*"|[^\s,]+)\s*/); + } else { + match = arg_str.match(/^(?,\s*)(?"([^"\\]|\\.)*"|[^\s,]+)\s*/); + } + + if (!match || !match.groups) { + return false; + } else { + const { arg_ws, arg } = match.groups; + args.push({ + col: col + arg_ws.length, + arg, + }); + + return tokenize_args(arg_str.slice(match[0].length), col + match[0].length, args); + } +} + +// TODO: proper error checking. +// TODO: UVars. +function parse_args(params: Param[], arg_tokens: ArgToken[], args: Arg[]): void { + for (let i = 0; i < params.length; i++) { + const param = params[i]; + const arg_str = arg_tokens[i].arg; + + switch (param.type) { + case Type.U8: + args.push({ + value: parseInt(arg_str, 10), + size: 1, + }); + break; + case Type.U16: + args.push({ + value: parseInt(arg_str, 10), + size: 2, + }); + break; + case Type.U32: + case Type.I32: + case Type.F32: + args.push({ + value: parseInt(arg_str, 10), + size: 4, + }); + break; + case Type.Register: + args.push({ + value: parseInt(arg_str.slice(1), 10), + size: 1, + }); + break; + case Type.String: + { + const value: string = JSON.parse(arg_str); + args.push({ + value, + size: 2 + 2 * value.length, + }); + } + break; + default: + throw new Error(`Type ${Type[param.type]} not implemented yet.`); + } + } +} diff --git a/src/ui/scripting/disassembly.ts b/src/scripting/disassembly.ts similarity index 84% rename from src/ui/scripting/disassembly.ts rename to src/scripting/disassembly.ts index ad026009..0ec9f6e6 100644 --- a/src/ui/scripting/disassembly.ts +++ b/src/scripting/disassembly.ts @@ -1,17 +1,20 @@ -import { Arg, Param, Type } from "../../data_formats/parsing/quest/bin"; -import { Quest } from "../../domain"; +import { Arg, Instruction, Param, Type } from "../data_formats/parsing/quest/bin"; /** * @param manual_stack If true, will ouput stack management instructions (argpush variants). Otherwise stack management instructions will not be output and their arguments will be output as arguments to the instruction that pops them from the stack. */ -export function disassemble(quest: Quest, manual_stack: boolean = false): string { +export function disassemble( + instructions: Instruction[], + labels: Map, + manual_stack: boolean = false +): string { const lines: string[] = []; - const index_to_label = new Map([...quest.labels.entries()].map(([l, i]) => [i, l])); + const index_to_label = new Map([...labels.entries()].map(([l, i]) => [i, l])); const stack: Arg[] = []; - for (let i = 0; i < quest.instructions.length; ++i) { - const ins = quest.instructions[i]; + for (let i = 0; i < instructions.length; ++i) { + const ins = instructions[i]; const label = index_to_label.get(i); if (!manual_stack && ins.opcode.push_stack) { diff --git a/src/ui/quest_editor/ScriptEditorComponent.tsx b/src/ui/quest_editor/ScriptEditorComponent.tsx index 581ad08c..f0a452d7 100644 --- a/src/ui/quest_editor/ScriptEditorComponent.tsx +++ b/src/ui/quest_editor/ScriptEditorComponent.tsx @@ -4,7 +4,7 @@ import { AutoSizer } from "react-virtualized"; import { OPCODES } from "../../data_formats/parsing/quest/bin"; import { quest_editor_store } from "../../stores/QuestEditorStore"; import "./ScriptEditorComponent.less"; -import { disassemble } from "../scripting/disassembly"; +import { disassemble } from "../../scripting/disassembly"; import { IReactionDisposer, autorun } from "mobx"; const ASM_SYNTAX: languages.IMonarchLanguage = { @@ -13,7 +13,7 @@ const ASM_SYNTAX: languages.IMonarchLanguage = { tokenizer: { root: [ // Identifiers. - [/[a-z][\w=<>!]*/, "identifier"], + [/[a-z][a-z_=<>!]*/, "identifier"], // Labels. [/^\d+:/, "tag"], @@ -23,8 +23,8 @@ const ASM_SYNTAX: languages.IMonarchLanguage = { // Whitespace. [/[ \t\r\n]+/, "white"], - [/\/\*/, "comment", "@comment"], - [/\/\/.*$/, "comment"], + // [/\/\*/, "comment", "@comment"], + // [/\/\/.*$/, "comment"], // Numbers. [/-?\d*\.\d+([eE][-+]?\d+)?/, "number.float"], @@ -39,12 +39,12 @@ const ASM_SYNTAX: languages.IMonarchLanguage = { [/"/, { token: "string.quote", bracket: "@open", next: "@string" }], ], - comment: [ - [/[^/*]+/, "comment"], - [/\/\*/, "comment", "@push"], // Nested comment. - [/\*\//, "comment", "@pop"], - [/[/*]/, "comment"], - ], + // comment: [ + // [/[^/*]+/, "comment"], + // [/\/\*/, "comment", "@push"], // Nested comment. + // [/\*\//, "comment", "@pop"], + // [/[/*]/, "comment"], + // ], string: [ [/[^\\"]+/, "string"], @@ -139,7 +139,9 @@ class MonacoComponent extends Component { this.disposer = autorun(() => { const quest = quest_editor_store.current_quest; - const model = quest && editor.createModel(disassemble(quest), "psoasm"); + const model = + quest && + editor.createModel(disassemble(quest.instructions, quest.labels, true), "psoasm"); if (model && this.editor) { // model.onDidChangeContent(e => {