iwa-inspector/src/iwa.ts
2023-12-14 22:13:56 -05:00

417 lines
16 KiB
TypeScript

import * as CFB from 'cfb';
import Messages, { $_TSP_MessageInfo, MessageTypes } from "./messages/";
/* see https://bugs.webkit.org/show_bug.cgi?id=243148 -- affects iOS Safari */
declare const Buffer: any; // Buffer is typeof-guarded but TS still needs this :(
const subarray: "subarray" | "slice" = (() => {
try {
if(typeof Uint8Array == "undefined") return "slice";
if(typeof Uint8Array.prototype.subarray == "undefined") return "slice";
// NOTE: feature tests are for node < 6.x
if(typeof Buffer !== "undefined") {
if(typeof Buffer.prototype.subarray == "undefined") return "slice";
if((typeof Buffer.from == "function" ? Buffer.from([72,62]) : new Buffer([72,62])) instanceof Uint8Array) return "subarray";
return "slice";
}
return "subarray";
} catch(e) { return "slice"; }
})();
/** Concatenate Uint8Arrays */
function u8concat(u8a: Uint8Array[]): Uint8Array {
let len = 0;
for(let i = 0; i < u8a.length; ++i) len += u8a[i].length;
const out = new Uint8Array(len);
let off = 0;
for(let i = 0; i < u8a.length; ++i) {
const u8 = u8a[i], L = u8.length;
if(L < 250) { for(let j = 0; j < L; ++j) out[off++] = u8[j]; }
else { out.set(u8, off); off += L; }
}
return out;
}
interface Ptr { l: number; }
/** Parse an integer from the varint that can be exactly stored in a double */
function parse_varint49(buf: Uint8Array, ptr: Ptr): number {
let l = ptr.l;
let usz = buf[l] & 0x7F;
varint: if(buf[l++] >= 0x80) {
usz |= (buf[l] & 0x7F) << 7; if(buf[l++] < 0x80) break varint;
usz |= (buf[l] & 0x7F) << 14; if(buf[l++] < 0x80) break varint;
usz |= (buf[l] & 0x7F) << 21; if(buf[l++] < 0x80) break varint;
usz += (buf[l] & 0x7F) * Math.pow(2, 28); ++l; if(buf[l++] < 0x80) break varint;
usz += (buf[l] & 0x7F) * Math.pow(2, 35); ++l; if(buf[l++] < 0x80) break varint;
usz += (buf[l] & 0x7F) * Math.pow(2, 42); ++l; if(buf[l++] < 0x80) break varint;
}
ptr.l = l;
return usz;
}
/** Parse a repeated varint [packed = true] field */
function parse_packed_varints(buf: Uint8Array): number[] {
const ptr: Ptr = {l: 0};
const out: number[] = [];
while(ptr.l < buf.length) out.push(parse_varint49(buf, ptr));
return out;
}
/** Parse a BigInt from the varint */
function parse_varint64(buf: Uint8Array, ptr: Ptr): bigint {
let l = ptr.l;
let usz = BigInt(buf[l] & 0x7F);
varint: if(buf[l++] >= 0x80) {
usz += BigInt(buf[l] & 0x7F) << 7n; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 14n; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 21n; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 28n; ++l; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 35n; ++l; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 42n; ++l; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 49n; ++l; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 56n; ++l; if(buf[l++] < 0x80) break varint;
usz += BigInt(buf[l] & 0x7F) << 63n; ++l; if(buf[l++] < 0x80) break varint;
}
ptr.l = l;
return usz;
}
/** Parse a repeated varint [packed = true] field */
function parse_packed_varint64(buf: Uint8Array): bigint[] {
const ptr: Ptr = {l: 0};
const out: bigint[] = [];
while(ptr.l < buf.length) out.push(parse_varint64(buf, ptr));
return out;
}
/** Parse a 32-bit signed integer from the raw varint */
function varint_to_i32(buf: Uint8Array): number {
let l = 0,
i32 = (buf[l] & 0x7F) ; if(buf[l++] < 0x80) return i32;
i32 |= (buf[l] & 0x7F) << 7; if(buf[l++] < 0x80) return i32;
i32 |= (buf[l] & 0x7F) << 14; if(buf[l++] < 0x80) return i32;
i32 |= (buf[l] & 0x7F) << 21; if(buf[l++] < 0x80) return i32;
i32 |= (buf[l] & 0x0F) << 28; return i32;
}
/** Parse a 64-bit unsigned integer as a pair */
function varint_to_u64(buf: Uint8Array): [number, number] {
let l = 0, lo = buf[l] & 0x7F, hi = 0;
varint: if(buf[l++] >= 0x80) {
lo |= (buf[l] & 0x7F) << 7; if(buf[l++] < 0x80) break varint;
lo |= (buf[l] & 0x7F) << 14; if(buf[l++] < 0x80) break varint;
lo |= (buf[l] & 0x7F) << 21; if(buf[l++] < 0x80) break varint;
lo |= (buf[l] & 0x7F) << 28; hi = (buf[l] >> 4) & 0x07; if(buf[l++] < 0x80) break varint;
hi |= (buf[l] & 0x7F) << 3; if(buf[l++] < 0x80) break varint;
hi |= (buf[l] & 0x7F) << 10; if(buf[l++] < 0x80) break varint;
hi |= (buf[l] & 0x7F) << 17; if(buf[l++] < 0x80) break varint;
hi |= (buf[l] & 0x7F) << 24; if(buf[l++] < 0x80) break varint;
hi |= (buf[l] & 0x7F) << 31;
}
return [lo >>> 0, hi >>> 0];
}
export { varint_to_i32, varint_to_u64 };
interface ProtoItem {
data: Uint8Array;
type: number;
}
type ProtoField = Array<ProtoItem>;
type ProtoMessage = Array<ProtoField>;
interface IWAMessage {
/** Metadata in .TSP.MessageInfo */
meta: ProtoMessage;
rawmeta: Uint8Array;
data: Uint8Array;
pre?: string;
parsed?: any;
parsedmeta?: $_TSP_MessageInfo;
}
interface IWAArchiveInfo {
id: number;
merge?: boolean;
messages: IWAMessage[];
}
/** Shallow parse of a Protobuf message */
function parse_shallow(buf: Uint8Array): ProtoMessage {
const out: ProtoMessage = [], ptr: Ptr = {l: 0};
while(ptr.l < buf.length) {
const off = ptr.l;
let num = parse_varint49(buf, ptr);
const type = num & 0x07;
num = (num / 8)|0;
let data: Uint8Array;
let l = ptr.l;
switch(type) {
case 0: {
while(buf[l++] >= 0x80);
data = buf[subarray](ptr.l, l);
ptr.l = l;
} break;
case 1: { data = buf[subarray](l, l + 8); ptr.l = l + 8; } break;
case 2: {
const len = parse_varint49(buf, ptr);
data = buf[subarray](ptr.l, ptr.l + len);
ptr.l += len;
} break;
case 5: { data = buf[subarray](l, l + 4); ptr.l = l + 4; } break;
default: throw new Error(`PB Type ${type} for Field ${num} at offset ${off}`);
}
const v: ProtoItem = { data, type };
if(out[num] == null) out[num] = [];
out[num].push(v);
}
return out;
}
/** Extract all messages from a IWA file */
function parse_iwa_file(buf: Uint8Array): IWAArchiveInfo[] {
const out: IWAArchiveInfo[] = [], ptr: Ptr = {l: 0};
while(ptr.l < buf.length) {
/* .TSP.ArchiveInfo */
const len = parse_varint49(buf, ptr);
const ai = parse_shallow(buf[subarray](ptr.l, ptr.l + len));
ptr.l += len;
const res: IWAArchiveInfo = {
/* TODO: technically ID is optional */
id: varint_to_i32(ai[1][0].data),
messages: []
};
ai[2].forEach(b => {
const mi = parse_shallow(b.data);
const fl = varint_to_i32(mi[3][0].data);
res.messages.push({
meta: mi,
rawmeta: b.data,
data: buf[subarray](ptr.l, ptr.l + fl)
});
ptr.l += fl;
});
if(ai[3]?.[0]) res.merge = (varint_to_i32(ai[3][0].data) >>> 0) > 0;
out.push(res);
}
return out;
}
/** Decompress a snappy chunk */
function parse_snappy_chunk(type: number, buf: Uint8Array): Uint8Array[] {
if(type != 0) throw new Error(`Unexpected Snappy chunk type ${type}`);
const ptr: Ptr = {l: 0};
const usz = parse_varint49(buf, ptr);
let chunks: Uint8Array[] = [];
let l = ptr.l;
while(l < buf.length) {
const tag = buf[l] & 0x3;
if(tag == 0) {
let len = buf[l++] >> 2;
if(len < 60) ++len;
else {
const c = len - 59;
len = buf[l];
if(c > 1) len |= (buf[l+1]<<8);
if(c > 2) len |= (buf[l+2]<<16);
if(c > 3) len |= (buf[l+3]<<24);
len >>>=0; len++;
l += c;
}
chunks.push(buf[subarray](l, l + len)); l += len; continue;
} else {
let offset = 0, length = 0;
if(tag == 1) {
length = ((buf[l] >> 2) & 0x7) + 4;
offset = (buf[l++] & 0xE0) << 3;
offset |= buf[l++];
} else {
length = (buf[l++] >> 2) + 1;
if(tag == 2) { offset = buf[l] | (buf[l+1]<<8); l += 2; }
else { offset = (buf[l] | (buf[l+1]<<8) | (buf[l+2]<<16) | (buf[l+3]<<24))>>>0; l += 4; }
}
if(offset == 0) throw new Error("Invalid offset 0");
let j = chunks.length - 1, off = offset;
while(j >=0 && off >= chunks[j].length) { off -= chunks[j].length; --j; }
if(j < 0) {
if(off == 0) off = chunks[(j = 0)].length;
else throw new Error("Invalid offset beyond length");
}
// Node 0.8 Buffer slice does not support negative indices
if(length < off) chunks.push(chunks[j][subarray](chunks[j].length-off, chunks[j].length-off + length));
else {
if(off > 0) { chunks.push(chunks[j][subarray](chunks[j].length-off)); length -= off; } ++j;
while(length >= chunks[j].length) { chunks.push(chunks[j]); length -= chunks[j].length; ++j; }
if(length) chunks.push(chunks[j][subarray](0, length));
}
if(chunks.length > 25) chunks = [u8concat(chunks)];
}
}
let clen = 0; for(let u8i = 0; u8i < chunks.length; ++u8i) clen += chunks[u8i].length;
if(clen != usz) throw new Error(`Unexpected length: ${clen} != ${usz}`);
return chunks;
}
/** Decompress IWA file */
function decompress_iwa_file(buf: Uint8Array): Uint8Array {
if(Array.isArray(buf)) buf = new Uint8Array(buf);
const out: Uint8Array[] = [];
let l = 0;
while(l < buf.length) {
const t = buf[l++];
const len = buf[l] | (buf[l+1]<<8) | (buf[l+2] << 16); l += 3;
out.push(...parse_snappy_chunk(t, buf[subarray](l, l + len)));
l += len;
}
if(l !== buf.length) throw new Error("data is not a valid framed stream!");
return out.length == 1 ? out[0] : u8concat(out);
}
type MessageSpace = {[id: number]: IWAMessage[]};
type TableItem = { id: number; path: string; type: number; message: string; };
interface ParsedFile {
space: MessageSpace;
tbl: TableItem[];
type: MessageTypes;
}
function parse_iwa(cfb: CFB.CFB$Container): ParsedFile {
const M: MessageSpace = {}, indices: number[] = [], tbl: TableItem[] = [];
cfb.FullPaths.forEach(p => { if(p.match(/\.iwpv2/)) throw new Error(`Unsupported password protection`); });
let root!: TableItem, rootmsg!: IWAMessage;
/* collect entire message space */
cfb.FileIndex.forEach((s, idx) => {
if(!s.name.match(/\.iwa$/)) return;
if(s.content[0] != 0) return; // TODO: this should test if the iwa follows the framing format
let o: Uint8Array;
try { o = decompress_iwa_file(s.content as Uint8Array); } catch(e: any) { return console.log("?? " + s.content.length + " " + ((e as Error).message || e)); }
let packets: IWAArchiveInfo[];
try { packets = parse_iwa_file(o); } catch(e: any) { return console.log("## " + ((e as Error).message || e)); }
packets.forEach(packet => { M[packet.id] = packet.messages; indices.push(packet.id);
const type = varint_to_i32(packet.messages[0].meta[1][0].data);
const item = {
id: packet.id,
type,
path:cfb.FullPaths[idx].replace(/Root Entry/, ""),
message: "??"
};
if(item.id == 1) { root = item; rootmsg = packet.messages[0]; }
tbl.push(item);
});
});
if(!indices.length) throw new Error("File has no messages");
if(!root) throw new Error(`Root element (id 1) missing!`);
let type: MessageTypes = "N";
if(root.type == 10000) type = "P";
else if(parse_shallow(rootmsg.data)?.[2]?.[0]) type = "K";
tbl.forEach(item => item.message = Messages[type][item.type] || "??");
return { space: M, tbl, type };
}
function process_item(item: {data: Uint8Array; type: number}, type: string, protos: any) {
switch(item.type) {
case 0: {
const varint = parse_varint49(item.data, {l:0});
switch(type) {
case "bool": return !!+varint;
case "uint32": return varint;
case "int32": return varint | 0;
case "sint32": return (-(varint&1))^(varint>>1);
case "uint64": { const u64 = varint_to_u64(item.data); return (BigInt(u64[1])<<32n) + BigInt(u64[0]); }
case "int64": { const u64 = varint_to_u64(item.data); return new BigInt64Array([(BigInt(u64[1])<<32n) + BigInt(u64[0])])[0]; }
case "sint64": { const u64 = varint_to_u64(item.data); const bi = (BigInt(u64[1])<<32n) + BigInt(u64[0]); return (-(bi&1n))^(bi>>1n); }
}
} break;
case 1: switch(type) {
case "fixed64": return new BigUint64Array(new Uint8Array([...item.data]).buffer)[0];
case "sfixed64": return new BigInt64Array(new Uint8Array([...item.data]).buffer)[0];
case "double": return new Float64Array(new Uint8Array([...item.data]).buffer)[0];
} break;
case 2: switch(type) {
case "string": return new TextDecoder().decode(item.data);
case "bytes": return item.data;
} break;
case 5: switch(type) {
case "float": return new Float32Array(new Uint8Array([...item.data]).buffer)[0];
case "fixed32": return new Uint32Array(new Uint8Array([...item.data]).buffer)[0];
case "sfixed32": return new Int32Array(new Uint8Array([...item.data]).buffer)[0];
}
}
if(protos[type]) return process(item.data, type, protos);
console.error(item);
return item;
}
function process_enum(data: Uint8Array, message: string, protos: any) {
let val = parse_varint49(data, {l: 0});
if(val >= 4294967296) val |= 0;
const msg = protos[message].split("\n");
for(const m of msg) {
if(m.startsWith("enum")) continue;
if(m.indexOf("=")> -1) {
const [field, , value] = m.trim().split(" ");
if(val == parseInt(value, 10)) {
const res = {}
Object.defineProperty(res, "value", { get: () => val});
Object.defineProperty(res, "PB_ENUM", { value: field, enumerable: false})
return res;
}
}
}
throw [val, message, protos[message]];
}
function process(data: Uint8Array, message: string, protos: any) {
if(!protos[message]) return parse_shallow(data);
const shallow = parse_shallow(data);
const proto: string[] = protos[message].split("\n");
const out: any = {};
if(proto[0].startsWith("enum")) return process_enum(data, message, protos);
proto.forEach(line => {
if(!line.startsWith(" ") || line.indexOf("=") == -1 || line.startsWith(" ")) return;
const [freq, type, name, , idx] = line.trim().split(/\s+/);
const i = parseInt(idx, 10);
if(isNaN(i)) return;
if(!shallow[i]?.length) return;
switch(freq) {
case "repeated": {
if(/packed\s*=\s*true/.test(line)) {
/* these are the known types as of iwa 13.2 */
switch(type) {
case "uint32": out[name] = parse_packed_varints(shallow[i][0].data); break;
case "uint64": out[name] = parse_packed_varint64(shallow[i][0].data); break;
case "fixed64": out[name] = new BigUint64Array(new Uint8Array(shallow[i][0].data).buffer); break;
default:
console.log(shallow[i][0], line);
throw new Error(`unsupported packed field of type ${type}`);
}
} else out[name] = shallow[i].map(item => protos[type]?.startsWith("enum") ? process_enum(item.data, type, protos) : process_item(item, type, protos));
} break;
case "required": case "optional": out[name] = protos[type]?.startsWith("enum") ? process_enum(shallow[i][0].data, type, protos) : process_item(shallow[i][0], type, protos); break
default: throw `unsupported frequency ${freq}`;
}
if(type.startsWith(".")) {
if(freq == "repeated") out[name].forEach((n: any) => {try { Object.defineProperty(n, "PB_TYPE", {value: type, enumerable: false}); } catch(e){/*empty*/}});
else try { Object.defineProperty(out[name], "PB_TYPE", {value: type, enumerable: false}); } catch(e) {/*empty*/}
}
try {
if(freq == "repeated") out[name].forEach((n: any, idx:number) => {try { Object.defineProperty(n, "PB_RAW", {value: shallow[i][idx], enumerable: false}); } catch(e){/*empty*/}});
else try { Object.defineProperty(out[name], "PB_RAW", {value: shallow[i][0], enumerable: false}); } catch(e) {/*empty*/}
} catch(e){console.log(e);}
try {
if(freq == "repeated") out[name].forEach((n: any, idx:number) => {try { Object.defineProperty(n, "PB_FIELD", {value: `${name}[${idx}]` , enumerable: false}); } catch(e){/*empty*/}});
else try { Object.defineProperty(out[name], "PB_FIELD", {value: name, enumerable: false}); } catch(e) {/*empty*/}
} catch(e){console.log(e);}
})
return out;
}
function read(ab: ArrayBuffer): ParsedFile {
let cfb: CFB.CFB$Container;
try {
cfb = CFB.read(new Uint8Array(ab), {type: "buffer"});
} catch(e) { throw new Error(`Failed to read archive: |${e&&(e as any).message||e}|`); }
return parse_iwa(cfb);
}
export { parse_iwa, read, process }
export type { MessageSpace, TableItem, ParsedFile };