mirror of
https://github.com/DaanVandenBosch/phantasmal-world.git
synced 2025-04-05 07:18:29 +08:00
Fixed .qst embedded file naming bug. Implemented simpler PRS compression algorithm that seems to cause fewer errors during roundtrip tests.
This commit is contained in:
parent
194df177ab
commit
48b683f514
@ -1,130 +1,101 @@
|
|||||||
|
import { Endianness } from "../..";
|
||||||
import { Cursor } from "../../cursor/Cursor";
|
import { Cursor } from "../../cursor/Cursor";
|
||||||
import { ResizableBufferCursor } from "../../cursor/ResizableBufferCursor";
|
import { ResizableBufferCursor } from "../../cursor/ResizableBufferCursor";
|
||||||
import { WritableCursor } from "../../cursor/WritableCursor";
|
import { WritableCursor } from "../../cursor/WritableCursor";
|
||||||
import { ResizableBuffer } from "../../ResizableBuffer";
|
import { ResizableBuffer } from "../../ResizableBuffer";
|
||||||
|
|
||||||
export function prs_compress(src: Cursor): Cursor {
|
export function prs_compress(cursor: Cursor): Cursor {
|
||||||
const ctx = new Context(src);
|
const pc = new Context(cursor.size, cursor.endianness);
|
||||||
const hash_table = new HashTable();
|
|
||||||
|
|
||||||
if (ctx.src.size <= 3) {
|
while (cursor.bytes_left) {
|
||||||
// Make a literal copy of the input.
|
// Find the longest match.
|
||||||
while (ctx.src.bytes_left) {
|
let best_offset = 0;
|
||||||
ctx.set_bit(1);
|
let best_size = 0;
|
||||||
ctx.copy_literal();
|
const min_offset = Math.max(0, cursor.position - Math.min(0x800, cursor.bytes_left));
|
||||||
}
|
|
||||||
} else {
|
|
||||||
// Add the first two "strings" to the hash table.
|
|
||||||
hash_table.put(hash_table.hash(ctx.src), 0);
|
|
||||||
ctx.src.seek(1);
|
|
||||||
hash_table.put(hash_table.hash(ctx.src), 1);
|
|
||||||
ctx.src.seek(-1);
|
|
||||||
|
|
||||||
// Copy the first two bytes as literals.
|
for (let i = cursor.position - 255; i >= min_offset; i--) {
|
||||||
ctx.set_bit(1);
|
let s1 = cursor.position;
|
||||||
ctx.copy_literal();
|
let s2 = i;
|
||||||
ctx.set_bit(1);
|
let size = 0;
|
||||||
ctx.copy_literal();
|
|
||||||
|
|
||||||
while (ctx.src.bytes_left > 1) {
|
// Optimization: compare 4 bytes at a time while we can.
|
||||||
let [offset, mlen] = ctx.find_longest_match(hash_table, false);
|
while (s1 + 3 < cursor.size && size < 252 && cursor.u32_at(s1) === cursor.u32_at(s2)) {
|
||||||
|
size += 4;
|
||||||
if (mlen > 0) {
|
s1 += 4;
|
||||||
ctx.src.seek(1);
|
s2 += 4;
|
||||||
const [offset2, mlen2] = ctx.find_longest_match(hash_table, true);
|
|
||||||
ctx.src.seek(-1);
|
|
||||||
|
|
||||||
// Did the "lazy match" produce something more compressed?
|
|
||||||
if (mlen2 > mlen) {
|
|
||||||
let copy_literal = true;
|
|
||||||
// Check if it is a good idea to switch from a short match to a long one.
|
|
||||||
if (mlen >= 2 && mlen <= 5 && offset2 < offset) {
|
|
||||||
if (offset >= -256 && offset2 < -256) {
|
|
||||||
if (mlen2 - mlen < 3) {
|
|
||||||
copy_literal = false;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
if (copy_literal) {
|
|
||||||
ctx.set_bit(1);
|
|
||||||
ctx.copy_literal();
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// What kind of match did we find?
|
|
||||||
if (mlen >= 2 && mlen <= 5 && offset >= -256) {
|
|
||||||
// Short match.
|
|
||||||
ctx.set_bit(0);
|
|
||||||
ctx.set_bit(0);
|
|
||||||
ctx.set_bit((mlen - 2) & 0x02);
|
|
||||||
ctx.set_bit((mlen - 2) & 0x01);
|
|
||||||
ctx.write_literal(offset & 0xff);
|
|
||||||
ctx.add_intermediates(hash_table, mlen);
|
|
||||||
continue;
|
|
||||||
} else if (mlen >= 3 && mlen <= 9) {
|
|
||||||
// Long match, short length.
|
|
||||||
ctx.set_bit(0);
|
|
||||||
ctx.set_bit(1);
|
|
||||||
ctx.write_literal(((offset & 0x1f) << 3) | ((mlen - 2) & 0x07));
|
|
||||||
ctx.write_literal(offset >> 5);
|
|
||||||
ctx.add_intermediates(hash_table, mlen);
|
|
||||||
continue;
|
|
||||||
} else if (mlen > 9) {
|
|
||||||
// Long match, long length.
|
|
||||||
if (mlen > 256) {
|
|
||||||
mlen = 256;
|
|
||||||
}
|
|
||||||
|
|
||||||
ctx.set_bit(0);
|
|
||||||
ctx.set_bit(1);
|
|
||||||
ctx.write_literal((offset & 0x1f) << 3);
|
|
||||||
ctx.write_literal(offset >> 5);
|
|
||||||
ctx.write_literal(mlen - 1);
|
|
||||||
ctx.add_intermediates(hash_table, mlen);
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// If we get here, we didn't find a suitable match, so just we just make a literal copy.
|
while (s1 < cursor.size && size < 255 && cursor.u8_at(s1) === cursor.u8_at(s2)) {
|
||||||
ctx.set_bit(1);
|
size++;
|
||||||
ctx.copy_literal();
|
s1++;
|
||||||
|
s2++;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (size >= best_size) {
|
||||||
|
best_offset = i;
|
||||||
|
best_size = size;
|
||||||
|
|
||||||
|
if (size >= 255) {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// If there's a left over byte at the end, make a literal copy.
|
if (best_size < 3) {
|
||||||
if (ctx.src.bytes_left) {
|
pc.add_u8(cursor.u8());
|
||||||
ctx.set_bit(1);
|
} else {
|
||||||
ctx.copy_literal();
|
pc.copy(best_offset - cursor.position, best_size);
|
||||||
|
cursor.seek(best_size);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
ctx.write_eof();
|
return pc.finalize();
|
||||||
|
|
||||||
return ctx.dst.seek_start(0);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
const MAX_WINDOW = 0x2000;
|
|
||||||
const WINDOW_MASK = MAX_WINDOW - 1;
|
|
||||||
const HASH_SIZE = 1 << 8;
|
|
||||||
|
|
||||||
class Context {
|
class Context {
|
||||||
src: Cursor;
|
private readonly output: WritableCursor;
|
||||||
dst: WritableCursor;
|
private flags = 0;
|
||||||
flags = 0;
|
private flag_bits_left = 0;
|
||||||
flag_bits_left = 0;
|
private flag_offset = 0;
|
||||||
flag_offset = 0;
|
|
||||||
|
|
||||||
constructor(cursor: Cursor) {
|
constructor(capacity: number, endianness: Endianness) {
|
||||||
this.src = cursor;
|
this.output = new ResizableBufferCursor(new ResizableBuffer(capacity), endianness);
|
||||||
this.dst = new ResizableBufferCursor(new ResizableBuffer(cursor.size), cursor.endianness);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
set_bit(bit: number): void {
|
add_u8(value: number): void {
|
||||||
if (!this.flag_bits_left--) {
|
this.write_control_bit(1);
|
||||||
|
this.write_u8(value);
|
||||||
|
}
|
||||||
|
|
||||||
|
copy(offset: number, size: number): void {
|
||||||
|
if (offset > -256 && size <= 5) {
|
||||||
|
this.short_copy(offset, size);
|
||||||
|
} else {
|
||||||
|
this.long_copy(offset, size);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
finalize(): Cursor {
|
||||||
|
this.write_control_bit(0);
|
||||||
|
this.write_control_bit(1);
|
||||||
|
|
||||||
|
this.flags >>>= this.flag_bits_left;
|
||||||
|
const pos = this.output.position;
|
||||||
|
this.output
|
||||||
|
.seek_start(this.flag_offset)
|
||||||
|
.write_u8(this.flags)
|
||||||
|
.seek_start(pos);
|
||||||
|
|
||||||
|
this.write_u8(0);
|
||||||
|
this.write_u8(0);
|
||||||
|
return this.output.seek_start(0);
|
||||||
|
}
|
||||||
|
|
||||||
|
private write_control_bit(bit: number): void {
|
||||||
|
if (this.flag_bits_left-- === 0) {
|
||||||
// Write out the flags to their position in the file, and store the next flags byte position.
|
// Write out the flags to their position in the file, and store the next flags byte position.
|
||||||
const pos = this.dst.position;
|
const pos = this.output.position;
|
||||||
this.dst
|
this.output
|
||||||
.seek_start(this.flag_offset)
|
.seek_start(this.flag_offset)
|
||||||
.write_u8(this.flags)
|
.write_u8(this.flags)
|
||||||
.seek_start(pos)
|
.seek_start(pos)
|
||||||
@ -140,161 +111,31 @@ class Context {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
copy_literal(): void {
|
private write_u8(data: number): void {
|
||||||
this.dst.write_u8(this.src.u8());
|
this.output.write_u8(data);
|
||||||
}
|
}
|
||||||
|
|
||||||
write_literal(value: number): void {
|
private short_copy(offset: number, size: number): void {
|
||||||
this.dst.write_u8(value);
|
size -= 2;
|
||||||
|
this.write_control_bit(0);
|
||||||
|
this.write_control_bit(0);
|
||||||
|
this.write_control_bit((size >>> 1) & 1);
|
||||||
|
this.write_control_bit(size & 1);
|
||||||
|
this.write_u8(offset & 0xff);
|
||||||
}
|
}
|
||||||
|
|
||||||
write_final_flags(): void {
|
private long_copy(offset: number, size: number): void {
|
||||||
this.flags >>>= this.flag_bits_left;
|
if (size <= 9) {
|
||||||
const pos = this.dst.position;
|
this.write_control_bit(0);
|
||||||
this.dst
|
this.write_control_bit(1);
|
||||||
.seek_start(this.flag_offset)
|
this.write_u8(((offset << 3) & 0xf8) | ((size - 2) & 0x07));
|
||||||
.write_u8(this.flags)
|
this.write_u8((offset >> 5) & 0xff);
|
||||||
.seek_start(pos);
|
} else {
|
||||||
}
|
this.write_control_bit(0);
|
||||||
|
this.write_control_bit(1);
|
||||||
write_eof(): void {
|
this.write_u8((offset << 3) & 0xf8);
|
||||||
this.set_bit(0);
|
this.write_u8((offset >> 5) & 0xff);
|
||||||
this.set_bit(1);
|
this.write_u8(size - 1);
|
||||||
|
|
||||||
this.write_final_flags();
|
|
||||||
|
|
||||||
this.write_literal(0);
|
|
||||||
this.write_literal(0);
|
|
||||||
}
|
|
||||||
|
|
||||||
match_length(s2: number): number {
|
|
||||||
let len = 0;
|
|
||||||
let s1 = this.src.position;
|
|
||||||
const size = this.src.size;
|
|
||||||
|
|
||||||
while (s1 < size - 4 && this.src.u32_at(s1) === this.src.u32_at(s2)) {
|
|
||||||
len += 4;
|
|
||||||
s1 += 4;
|
|
||||||
s2 += 4;
|
|
||||||
}
|
|
||||||
|
|
||||||
while (s1 < size && this.src.u8_at(s1) === this.src.u8_at(s2)) {
|
|
||||||
++len;
|
|
||||||
++s1;
|
|
||||||
++s2;
|
|
||||||
}
|
|
||||||
|
|
||||||
return len;
|
|
||||||
}
|
|
||||||
|
|
||||||
find_longest_match(hash_table: HashTable, lazy: boolean): [number, number] {
|
|
||||||
if (!this.src.bytes_left) {
|
|
||||||
return [0, 0];
|
|
||||||
}
|
|
||||||
|
|
||||||
// Figure out where we're looking.
|
|
||||||
const hash = hash_table.hash(this.src);
|
|
||||||
|
|
||||||
// If there is nothing in the table at that point, bail out now.
|
|
||||||
let entry = hash_table.get(hash);
|
|
||||||
|
|
||||||
if (entry === -1) {
|
|
||||||
if (!lazy) {
|
|
||||||
hash_table.put(hash, this.src.position);
|
|
||||||
}
|
|
||||||
|
|
||||||
return [0, 0];
|
|
||||||
}
|
|
||||||
|
|
||||||
// If we'd go outside the window, truncate the hash chain now.
|
|
||||||
if (this.src.position - entry > MAX_WINDOW) {
|
|
||||||
hash_table.hash_to_offset[hash] = -1;
|
|
||||||
|
|
||||||
if (!lazy) {
|
|
||||||
hash_table.put(hash, this.src.position);
|
|
||||||
}
|
|
||||||
|
|
||||||
return [0, 0];
|
|
||||||
}
|
|
||||||
|
|
||||||
// Ok, we have something in the hash table that matches the hash value.
|
|
||||||
// Follow the chain to see if we have an actual string match, and find the longest match.
|
|
||||||
let longest_length = 0;
|
|
||||||
let longest_match = 0;
|
|
||||||
|
|
||||||
while (entry !== -1) {
|
|
||||||
const mlen = this.match_length(entry);
|
|
||||||
|
|
||||||
if (mlen > longest_length || mlen >= 256) {
|
|
||||||
longest_length = mlen;
|
|
||||||
longest_match = entry;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Follow the chain, making sure not to exceed a difference of MAX_WINDOW.
|
|
||||||
let entry_2 = hash_table.prev(entry);
|
|
||||||
|
|
||||||
if (entry_2 !== -1) {
|
|
||||||
// If we'd go outside the window, truncate the hash chain now.
|
|
||||||
if (this.src.position - entry_2 > MAX_WINDOW) {
|
|
||||||
hash_table.set_prev(entry, -1);
|
|
||||||
entry_2 = -1;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
entry = entry_2;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Add our current string to the hash.
|
|
||||||
if (!lazy) {
|
|
||||||
hash_table.put(hash, this.src.position);
|
|
||||||
}
|
|
||||||
|
|
||||||
// Did we find a match?
|
|
||||||
const offset = longest_length > 0 ? longest_match - this.src.position : 0;
|
|
||||||
return [offset, longest_length];
|
|
||||||
}
|
|
||||||
|
|
||||||
add_intermediates(hash_table: HashTable, len: number): void {
|
|
||||||
this.src.seek(1);
|
|
||||||
|
|
||||||
for (let i = 1; i < len; ++i) {
|
|
||||||
const hash = hash_table.hash(this.src);
|
|
||||||
hash_table.put(hash, this.src.position);
|
|
||||||
this.src.seek(1);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
class HashTable {
|
|
||||||
hash_to_offset = new Int32Array(HASH_SIZE).fill(-1);
|
|
||||||
masked_offset_to_prev = new Int16Array(MAX_WINDOW).fill(-1);
|
|
||||||
|
|
||||||
hash(cursor: Cursor): number {
|
|
||||||
let hash = cursor.u8();
|
|
||||||
|
|
||||||
if (cursor.bytes_left) {
|
|
||||||
hash ^= cursor.u8();
|
|
||||||
cursor.seek(-1);
|
|
||||||
}
|
|
||||||
|
|
||||||
cursor.seek(-1);
|
|
||||||
return hash;
|
|
||||||
}
|
|
||||||
|
|
||||||
get(hash: number): number {
|
|
||||||
return this.hash_to_offset[hash];
|
|
||||||
}
|
|
||||||
|
|
||||||
put(hash: number, offset: number): void {
|
|
||||||
this.set_prev(offset, this.hash_to_offset[hash]);
|
|
||||||
this.hash_to_offset[hash] = offset;
|
|
||||||
}
|
|
||||||
|
|
||||||
prev(offset: number): number {
|
|
||||||
return this.masked_offset_to_prev[offset & WINDOW_MASK];
|
|
||||||
}
|
|
||||||
|
|
||||||
set_prev(offset: number, prev_offset: number): void {
|
|
||||||
this.masked_offset_to_prev[offset & WINDOW_MASK] = prev_offset;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
300
src/data_formats/compression/prs/compress_high.ts
Normal file
300
src/data_formats/compression/prs/compress_high.ts
Normal file
@ -0,0 +1,300 @@
|
|||||||
|
import { Cursor } from "../../cursor/Cursor";
|
||||||
|
import { ResizableBufferCursor } from "../../cursor/ResizableBufferCursor";
|
||||||
|
import { WritableCursor } from "../../cursor/WritableCursor";
|
||||||
|
import { ResizableBuffer } from "../../ResizableBuffer";
|
||||||
|
|
||||||
|
export function prs_compress_high(src: Cursor): Cursor {
|
||||||
|
const ctx = new Context(src);
|
||||||
|
const hash_table = new HashTable();
|
||||||
|
|
||||||
|
if (ctx.src.size <= 3) {
|
||||||
|
// Make a literal copy of the input.
|
||||||
|
while (ctx.src.bytes_left) {
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
// Add the first two "strings" to the hash table.
|
||||||
|
hash_table.put(hash_table.hash(ctx.src), 0);
|
||||||
|
ctx.src.seek(1);
|
||||||
|
hash_table.put(hash_table.hash(ctx.src), 1);
|
||||||
|
ctx.src.seek(-1);
|
||||||
|
|
||||||
|
// Copy the first two bytes as literals.
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
|
||||||
|
while (ctx.src.bytes_left > 1) {
|
||||||
|
let [offset, mlen] = ctx.find_longest_match(hash_table, false);
|
||||||
|
|
||||||
|
if (mlen > 0) {
|
||||||
|
ctx.src.seek(1);
|
||||||
|
const [offset2, mlen2] = ctx.find_longest_match(hash_table, true);
|
||||||
|
ctx.src.seek(-1);
|
||||||
|
|
||||||
|
// Did the "lazy match" produce something more compressed?
|
||||||
|
if (mlen2 > mlen) {
|
||||||
|
let copy_literal = true;
|
||||||
|
// Check if it is a good idea to switch from a short match to a long one.
|
||||||
|
if (mlen >= 2 && mlen <= 5 && offset2 < offset) {
|
||||||
|
if (offset >= -256 && offset2 < -256) {
|
||||||
|
if (mlen2 - mlen < 3) {
|
||||||
|
copy_literal = false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (copy_literal) {
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// What kind of match did we find?
|
||||||
|
if (mlen >= 2 && mlen <= 5 && offset >= -256) {
|
||||||
|
// Short match.
|
||||||
|
ctx.set_bit(0);
|
||||||
|
ctx.set_bit(0);
|
||||||
|
ctx.set_bit((mlen - 2) & 0x02);
|
||||||
|
ctx.set_bit((mlen - 2) & 0x01);
|
||||||
|
ctx.write_literal(offset & 0xff);
|
||||||
|
ctx.add_intermediates(hash_table, mlen);
|
||||||
|
continue;
|
||||||
|
} else if (mlen >= 3 && mlen <= 9) {
|
||||||
|
// Long match, short length.
|
||||||
|
ctx.set_bit(0);
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.write_literal(((offset & 0x1f) << 3) | ((mlen - 2) & 0x07));
|
||||||
|
ctx.write_literal(offset >> 5);
|
||||||
|
ctx.add_intermediates(hash_table, mlen);
|
||||||
|
continue;
|
||||||
|
} else if (mlen > 9) {
|
||||||
|
// Long match, long length.
|
||||||
|
if (mlen > 256) {
|
||||||
|
mlen = 256;
|
||||||
|
}
|
||||||
|
|
||||||
|
ctx.set_bit(0);
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.write_literal((offset & 0x1f) << 3);
|
||||||
|
ctx.write_literal(offset >> 5);
|
||||||
|
ctx.write_literal(mlen - 1);
|
||||||
|
ctx.add_intermediates(hash_table, mlen);
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// If we get here, we didn't find a suitable match, so just we just make a literal copy.
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
}
|
||||||
|
|
||||||
|
// If there's a left over byte at the end, make a literal copy.
|
||||||
|
if (ctx.src.bytes_left) {
|
||||||
|
ctx.set_bit(1);
|
||||||
|
ctx.copy_literal();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
ctx.write_eof();
|
||||||
|
|
||||||
|
return ctx.dst.seek_start(0);
|
||||||
|
}
|
||||||
|
|
||||||
|
const MAX_WINDOW = 0x2000;
|
||||||
|
const WINDOW_MASK = MAX_WINDOW - 1;
|
||||||
|
const HASH_SIZE = 1 << 8;
|
||||||
|
|
||||||
|
class Context {
|
||||||
|
src: Cursor;
|
||||||
|
dst: WritableCursor;
|
||||||
|
flags = 0;
|
||||||
|
flag_bits_left = 0;
|
||||||
|
flag_offset = 0;
|
||||||
|
|
||||||
|
constructor(cursor: Cursor) {
|
||||||
|
this.src = cursor;
|
||||||
|
this.dst = new ResizableBufferCursor(new ResizableBuffer(cursor.size), cursor.endianness);
|
||||||
|
}
|
||||||
|
|
||||||
|
set_bit(bit: number): void {
|
||||||
|
if (!this.flag_bits_left--) {
|
||||||
|
// Write out the flags to their position in the file, and store the next flags byte position.
|
||||||
|
const pos = this.dst.position;
|
||||||
|
this.dst
|
||||||
|
.seek_start(this.flag_offset)
|
||||||
|
.write_u8(this.flags)
|
||||||
|
.seek_start(pos)
|
||||||
|
.write_u8(0); // Placeholder for the next flags byte.
|
||||||
|
this.flag_offset = pos;
|
||||||
|
this.flag_bits_left = 7;
|
||||||
|
}
|
||||||
|
|
||||||
|
this.flags >>>= 1;
|
||||||
|
|
||||||
|
if (bit) {
|
||||||
|
this.flags |= 0x80;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
copy_literal(): void {
|
||||||
|
this.dst.write_u8(this.src.u8());
|
||||||
|
}
|
||||||
|
|
||||||
|
write_literal(value: number): void {
|
||||||
|
this.dst.write_u8(value);
|
||||||
|
}
|
||||||
|
|
||||||
|
write_final_flags(): void {
|
||||||
|
this.flags >>>= this.flag_bits_left;
|
||||||
|
const pos = this.dst.position;
|
||||||
|
this.dst
|
||||||
|
.seek_start(this.flag_offset)
|
||||||
|
.write_u8(this.flags)
|
||||||
|
.seek_start(pos);
|
||||||
|
}
|
||||||
|
|
||||||
|
write_eof(): void {
|
||||||
|
this.set_bit(0);
|
||||||
|
this.set_bit(1);
|
||||||
|
|
||||||
|
this.write_final_flags();
|
||||||
|
|
||||||
|
this.write_literal(0);
|
||||||
|
this.write_literal(0);
|
||||||
|
}
|
||||||
|
|
||||||
|
match_length(s2: number): number {
|
||||||
|
let len = 0;
|
||||||
|
let s1 = this.src.position;
|
||||||
|
const size = this.src.size;
|
||||||
|
|
||||||
|
while (s1 < size - 4 && this.src.u32_at(s1) === this.src.u32_at(s2)) {
|
||||||
|
len += 4;
|
||||||
|
s1 += 4;
|
||||||
|
s2 += 4;
|
||||||
|
}
|
||||||
|
|
||||||
|
while (s1 < size && this.src.u8_at(s1) === this.src.u8_at(s2)) {
|
||||||
|
++len;
|
||||||
|
++s1;
|
||||||
|
++s2;
|
||||||
|
}
|
||||||
|
|
||||||
|
return len;
|
||||||
|
}
|
||||||
|
|
||||||
|
find_longest_match(hash_table: HashTable, lazy: boolean): [number, number] {
|
||||||
|
if (!this.src.bytes_left) {
|
||||||
|
return [0, 0];
|
||||||
|
}
|
||||||
|
|
||||||
|
// Figure out where we're looking.
|
||||||
|
const hash = hash_table.hash(this.src);
|
||||||
|
|
||||||
|
// If there is nothing in the table at that point, bail out now.
|
||||||
|
let entry = hash_table.get(hash);
|
||||||
|
|
||||||
|
if (entry === -1) {
|
||||||
|
if (!lazy) {
|
||||||
|
hash_table.put(hash, this.src.position);
|
||||||
|
}
|
||||||
|
|
||||||
|
return [0, 0];
|
||||||
|
}
|
||||||
|
|
||||||
|
// If we'd go outside the window, truncate the hash chain now.
|
||||||
|
if (this.src.position - entry > MAX_WINDOW) {
|
||||||
|
hash_table.hash_to_offset[hash] = -1;
|
||||||
|
|
||||||
|
if (!lazy) {
|
||||||
|
hash_table.put(hash, this.src.position);
|
||||||
|
}
|
||||||
|
|
||||||
|
return [0, 0];
|
||||||
|
}
|
||||||
|
|
||||||
|
// Ok, we have something in the hash table that matches the hash value.
|
||||||
|
// Follow the chain to see if we have an actual string match, and find the longest match.
|
||||||
|
let longest_length = 0;
|
||||||
|
let longest_match = 0;
|
||||||
|
|
||||||
|
while (entry !== -1) {
|
||||||
|
const mlen = this.match_length(entry);
|
||||||
|
|
||||||
|
if (mlen > longest_length || mlen >= 256) {
|
||||||
|
longest_length = mlen;
|
||||||
|
longest_match = entry;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Follow the chain, making sure not to exceed a difference of MAX_WINDOW.
|
||||||
|
let entry_2 = hash_table.prev(entry);
|
||||||
|
|
||||||
|
if (entry_2 !== -1) {
|
||||||
|
// If we'd go outside the window, truncate the hash chain now.
|
||||||
|
if (this.src.position - entry_2 > MAX_WINDOW) {
|
||||||
|
hash_table.set_prev(entry, -1);
|
||||||
|
entry_2 = -1;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
entry = entry_2;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Add our current string to the hash.
|
||||||
|
if (!lazy) {
|
||||||
|
hash_table.put(hash, this.src.position);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Did we find a match?
|
||||||
|
const offset = longest_length > 0 ? longest_match - this.src.position : 0;
|
||||||
|
return [offset, longest_length];
|
||||||
|
}
|
||||||
|
|
||||||
|
add_intermediates(hash_table: HashTable, len: number): void {
|
||||||
|
this.src.seek(1);
|
||||||
|
|
||||||
|
for (let i = 1; i < len; ++i) {
|
||||||
|
const hash = hash_table.hash(this.src);
|
||||||
|
hash_table.put(hash, this.src.position);
|
||||||
|
this.src.seek(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
class HashTable {
|
||||||
|
hash_to_offset = new Int32Array(HASH_SIZE).fill(-1);
|
||||||
|
masked_offset_to_prev = new Int16Array(MAX_WINDOW).fill(-1);
|
||||||
|
|
||||||
|
hash(cursor: Cursor): number {
|
||||||
|
let hash = cursor.u8();
|
||||||
|
|
||||||
|
if (cursor.bytes_left) {
|
||||||
|
hash ^= cursor.u8();
|
||||||
|
cursor.seek(-1);
|
||||||
|
}
|
||||||
|
|
||||||
|
cursor.seek(-1);
|
||||||
|
return hash;
|
||||||
|
}
|
||||||
|
|
||||||
|
get(hash: number): number {
|
||||||
|
return this.hash_to_offset[hash];
|
||||||
|
}
|
||||||
|
|
||||||
|
put(hash: number, offset: number): void {
|
||||||
|
this.set_prev(offset, this.hash_to_offset[hash]);
|
||||||
|
this.hash_to_offset[hash] = offset;
|
||||||
|
}
|
||||||
|
|
||||||
|
prev(offset: number): number {
|
||||||
|
return this.masked_offset_to_prev[offset & WINDOW_MASK];
|
||||||
|
}
|
||||||
|
|
||||||
|
set_prev(offset: number, prev_offset: number): void {
|
||||||
|
this.masked_offset_to_prev[offset & WINDOW_MASK] = prev_offset;
|
||||||
|
}
|
||||||
|
}
|
@ -28,27 +28,27 @@ function test_with_bytes(bytes: number[], expected_compressed_size: number): voi
|
|||||||
}
|
}
|
||||||
|
|
||||||
test("PRS compression and decompression, best case", () => {
|
test("PRS compression and decompression, best case", () => {
|
||||||
// Compression factor: 0.018
|
// Compression factor: 0.048
|
||||||
test_with_bytes(new Array(1000).fill(128), 18);
|
test_with_bytes(new Array(10000).fill(128), 475);
|
||||||
});
|
});
|
||||||
|
|
||||||
test("PRS compression and decompression, worst case", () => {
|
test("PRS compression and decompression, worst case", () => {
|
||||||
const prng = new Prng();
|
const prng = new Prng();
|
||||||
|
|
||||||
// Compression factor: 1.124
|
// Compression factor: 1.125
|
||||||
test_with_bytes(new Array(1000).fill(0).map(() => prng.next_integer(0, 255)), 1124);
|
test_with_bytes(new Array(10000).fill(0).map(() => prng.next_integer(0, 255)), 11253);
|
||||||
});
|
});
|
||||||
|
|
||||||
test("PRS compression and decompression, typical case", () => {
|
test("PRS compression and decompression, typical case", () => {
|
||||||
const prng = new Prng();
|
const prng = new Prng();
|
||||||
const pattern = [0, 0, 2, 0, 3, 0, 5, 0, 0, 0, 7, 9, 11, 13, 0, 0];
|
const pattern = [0, 0, 2, 0, 3, 0, 5, 0, 0, 0, 7, 9, 11, 13, 0, 0];
|
||||||
const arrays = new Array(100)
|
const arrays = new Array(1000)
|
||||||
.fill(pattern)
|
.fill(pattern)
|
||||||
.map(array => array.map((e: number) => e + prng.next_integer(0, 10)));
|
.map(array => array.map((e: number) => e + prng.next_integer(0, 10)));
|
||||||
const flattened_array = [].concat.apply([], arrays);
|
const flattened_array = [].concat.apply([], arrays);
|
||||||
|
|
||||||
// Compression factor: 0.834
|
// Compression factor: 0.933
|
||||||
test_with_bytes(flattened_array, 1335);
|
test_with_bytes(flattened_array, 14924);
|
||||||
});
|
});
|
||||||
|
|
||||||
test("PRS compression and decompression, 0 bytes", () => {
|
test("PRS compression and decompression, 0 bytes", () => {
|
||||||
|
@ -125,7 +125,7 @@ export function write_quest_qst(quest: Quest, file_name: string): ArrayBuffer {
|
|||||||
);
|
);
|
||||||
const ext_start = file_name.lastIndexOf(".");
|
const ext_start = file_name.lastIndexOf(".");
|
||||||
const base_file_name =
|
const base_file_name =
|
||||||
ext_start === -1 ? file_name.slice(0, 12) : file_name.slice(0, Math.min(12, ext_start));
|
ext_start === -1 ? file_name.slice(0, 11) : file_name.slice(0, Math.min(11, ext_start));
|
||||||
|
|
||||||
return write_qst({
|
return write_qst({
|
||||||
files: [
|
files: [
|
||||||
|
@ -249,8 +249,8 @@ function parse_files(cursor: Cursor, expected_sizes: Map<string, number>): QstCo
|
|||||||
|
|
||||||
function write_file_headers(cursor: WritableCursor, files: QstContainedFileParam[]): void {
|
function write_file_headers(cursor: WritableCursor, files: QstContainedFileParam[]): void {
|
||||||
for (const file of files) {
|
for (const file of files) {
|
||||||
if (file.name.length > 16) {
|
if (file.name.length > 15) {
|
||||||
throw new Error(`File ${file.name} has a name longer than 16 characters.`);
|
throw new Error(`File ${file.name} has a name longer than 15 characters.`);
|
||||||
}
|
}
|
||||||
|
|
||||||
cursor.write_u16(88); // Header size.
|
cursor.write_u16(88); // Header size.
|
||||||
|
Loading…
Reference in New Issue
Block a user