sheetjs_sheetjs/modules/83_numbers.ts

1362 lines
52 KiB
TypeScript
Raw Normal View History

2022-01-29 02:29:34 +00:00
/*! sheetjs (C) 2013-present SheetJS -- http://sheetjs.com */
/// <reference path="src/types.ts"/>
2022-01-29 02:29:34 +00:00
2022-03-21 01:39:16 +00:00
/* these are type imports and do not show up in the generated JS */
import { CFB$Container, CFB$Entry } from 'cfb';
2022-07-13 07:52:29 +00:00
import { WorkBook, WorkSheet, Range, CellObject, ParsingOptions, WritingOptions } from '../';
import type { utils } from "../";
declare var encode_cell: typeof utils.encode_cell;
declare var encode_range: typeof utils.encode_range;
declare var book_new: typeof utils.book_new;
declare var book_append_sheet: typeof utils.book_append_sheet;
declare var sheet_to_json: typeof utils.sheet_to_json;
declare var decode_range: typeof utils.decode_range;
import * as _CFB from 'cfb';
declare var CFB: typeof _CFB;
2022-03-21 01:39:16 +00:00
//<<import { utils } from "../../";
//<<const { encode_cell, encode_range, book_new, book_append_sheet } = utils;
/* see https://bugs.webkit.org/show_bug.cgi?id=243148 -- affects iOS Safari */
declare var Buffer: any; // Buffer is typeof-guarded but TS still needs this :(
2022-07-16 22:07:53 +00:00
/**
 * Name of the method used throughout this file to take a byte range:
 * "subarray" when typed arrays (and Buffer, if present) support it and Buffer
 * instances are Uint8Arrays, otherwise "slice".
 */
var subarray: "subarray" | "slice" = (() => {
	try {
		var typed_ok = typeof Uint8Array != "undefined" && typeof Uint8Array.prototype.subarray != "undefined";
		if(!typed_ok) return "slice";
		if(typeof Buffer === "undefined") return "subarray";
		// NOTE: feature tests are for node < 6.x
		if(typeof Buffer.prototype.subarray == "undefined") return "slice";
		var probe = typeof Buffer.from == "function" ? Buffer.from([72,62]) : new Buffer([72,62]);
		return probe instanceof Uint8Array ? "subarray" : "slice";
	} catch(e) { return "slice"; }
})();
2022-07-13 07:52:29 +00:00
2022-03-21 01:39:16 +00:00
/** Build a DataView over exactly the bytes covered by `array` (same backing buffer) */
function u8_to_dataview(array: Uint8Array): DataView {
	var { buffer, byteOffset, byteLength } = array;
	return new DataView(buffer, byteOffset, byteLength);
}
//<<export { u8_to_dataview };
2022-03-21 01:39:16 +00:00
/** Decode bytes to a string: TextDecoder when the runtime has one, otherwise the utf8read/a2s helpers */
function u8str(u8: Uint8Array): string {
	/* Buffer.isBuffer(u8) ? u8.toString() : */
	if(typeof TextDecoder != "undefined") return new TextDecoder().decode(u8);
	return utf8read(a2s(u8));
}
/** Encode a string to bytes: TextEncoder when the runtime has one, otherwise the s2a/utf8write helpers */
function stru8(str: string): Uint8Array {
	if(typeof TextEncoder != "undefined") return new TextEncoder().encode(str);
	return s2a(utf8write(str)) as Uint8Array;
}
//<<export { u8str, stru8 };
/**
 * Test whether the byte sequence `search` occurs somewhere inside `body`.
 * The scan starts at the first occurrence of the first search byte and then
 * compares byte-by-byte at each candidate position.
 */
function u8contains(body: Uint8Array, search: Uint8Array): boolean {
	var L = body.indexOf(search[0]);
	if(L == -1) return false;
	outer: for(; L <= body.length - search.length; ++L) {
		for(var j = 0; j < search.length; ++j) if(body[L+j] != search[j]) continue outer;
		return true;
	}
	return false;
}
//<<export { u8contains }
2022-03-21 01:39:16 +00:00
/** Concatenate Uint8Arrays into one freshly allocated Uint8Array (inputs are copied, in order) */
function u8concat(u8a: Uint8Array[]): Uint8Array {
	var len = u8a.reduce((acc: number, x: Uint8Array) => acc + x.length, 0);
	var out = new Uint8Array(len);
	var off = 0;
	u8a.forEach(u8 => { out.set(u8, off); off += u8.length; });
	return out;
}
//<<export { u8concat };
2022-03-21 01:39:16 +00:00
/**
 * Count the number of bits set (assuming int32_t interpretation)
 *
 * Pairwise, then nibble-wise, partial sums are accumulated in place; the final
 * multiply gathers the four byte sums into the top byte.
 */
function popcnt(x: number): number {
	x -= ((x >> 1) & 0x55555555);
	x = (x & 0x33333333) + ((x >> 2) & 0x33333333);
	return (((x + (x >> 4)) & 0x0F0F0F0F) * 0x01010101) >>> 24;
}
2022-03-21 01:39:16 +00:00
/**
 * Read a 128-bit decimal from the modern cell storage
 *
 * Layout as decoded here (little-endian, 16 bytes starting at `offset`):
 * bit 7 of byte 15 is the sign, the next 14 bits are the biased exponent
 * (bias 0x1820) and the remaining low bits are the integer coefficient.
 * The result is a double, so coefficients beyond 2^53 lose precision.
 */
function readDecimal128LE(buf: Uint8Array, offset: number): number {
	var exp = ((buf[offset + 15] & 0x7F) << 7) | (buf[offset + 14] >> 1);
	var mantissa = buf[offset + 14] & 1;
	for(var j = offset + 13; j >= offset; --j) mantissa = mantissa * 256 + buf[j];
	return ((buf[offset+15] & 0x80) ? -mantissa : mantissa) * Math.pow(10, exp - 0x1820);
}
/**
 * Write a 128-bit decimal to the modern cell storage
 *
 * The value is scaled to a 17-digit integer coefficient, which is stored
 * little-endian from `offset`; the biased exponent (bias 0x1820) and the sign
 * bit are OR-ed into bytes 14 and 15, so the target bytes should start zeroed.
 */
function writeDecimal128LE(buf: Uint8Array, offset: number, value: number): void {
	// TODO: something more correct than this
	var exp = Math.floor(value == 0 ? 0 : /*Math.log10*/Math.LOG10E * Math.log(Math.abs(value))) + 0x1820 - 16;
	// the coefficient is unsigned (the sign is a separate bit), so scale the magnitude;
	// scaling the signed value left negative numbers with an all-zero coefficient
	var mantissa = (Math.abs(value) / Math.pow(10, exp - 0x1820));
	buf[offset+15] |= exp >> 7;
	buf[offset+14] |= (exp & 0x7F) << 1;
	// only bytes 0..13 hold coefficient bits; the bound also stops a non-finite mantissa from looping forever
	for(var i = 0; i < 14 && mantissa >= 1; ++i, mantissa /= 256) buf[offset + i] = mantissa & 0xFF;
	buf[offset+15] |= (value >= 0 ? 0 : 0x80);
}
/** Single-element cursor: ptr[0] is the current byte offset and is advanced by the readers */
type Ptr = [number];
/**
 * Parse an integer from the varint that can be exactly stored in a double
 *
 * Reads at most 7 bytes (49 bits) starting at `ptr[0]` (or 0 when no pointer is
 * given). When `ptr` is supplied it is advanced past the bytes consumed.
 */
function parse_varint49(buf: Uint8Array, ptr?: Ptr): number {
	var l = ptr ? ptr[0] : 0;
	var usz = buf[l] & 0x7F;
	varint: if(buf[l++] >= 0x80) {
		usz |= (buf[l] & 0x7F) <<  7; if(buf[l++] < 0x80) break varint;
		usz |= (buf[l] & 0x7F) << 14; if(buf[l++] < 0x80) break varint;
		usz |= (buf[l] & 0x7F) << 21; if(buf[l++] < 0x80) break varint;
		/* beyond 28 bits use arithmetic instead of int32 bit ops; the continuation
		   test must look at the same byte that was just accumulated */
		usz += (buf[l] & 0x7F) * Math.pow(2, 28); if(buf[l++] < 0x80) break varint;
		usz += (buf[l] & 0x7F) * Math.pow(2, 35); if(buf[l++] < 0x80) break varint;
		usz += (buf[l] & 0x7F) * Math.pow(2, 42); ++l;
	}
	if(ptr) ptr[0] = l;
	return usz;
}
2022-04-11 04:11:47 +00:00
/**
 * Write a varint up to 7 bytes / 49 bits
 *
 * Each output byte carries 7 payload bits, least-significant group first, with
 * the high bit set on every byte except the last.
 */
function write_varint49(v: number): Uint8Array {
	var usz = new Uint8Array(7);
	usz[0] = (v & 0x7F);
	var L = 1;
	sz: if(v > 0x7F) {
		usz[L-1] |= 0x80; usz[L] = (v >> 7) & 0x7F; ++L;
		if(v <= 0x3FFF) break sz;
		usz[L-1] |= 0x80; usz[L] = (v >> 14) & 0x7F; ++L;
		if(v <= 0x1FFFFF) break sz;
		usz[L-1] |= 0x80; usz[L] = (v >> 21) & 0x7F; ++L;
		if(v <= 0xFFFFFFF) break sz;
		/* groups above bit 27: divide first so the value fits the 32-bit shift,
		   total shift must be 28 / 35 / 42 bits (7 + 21, 14 + 21, 21 + 21) */
		usz[L-1] |= 0x80; usz[L] = ((v/0x80) >>> 21) & 0x7F; ++L;
		if(v <= 0x7FFFFFFFF) break sz;
		usz[L-1] |= 0x80; usz[L] = ((v/0x4000) >>> 21) & 0x7F; ++L;
		if(v <= 0x3FFFFFFFFFF) break sz;
		usz[L-1] |= 0x80; usz[L] = ((v/0x200000) >>> 21) & 0x7F; ++L;
	}
	return usz[subarray](0, L);
}
/** Decode a packed repeated varint field: varints are read back-to-back until the buffer is exhausted */
function parse_packed_varints(buf: Uint8Array): number[] {
	var values: number[] = [];
	for(var cursor: Ptr = [0]; cursor[0] < buf.length;) values.push(parse_varint49(buf, cursor));
	return values;
}
/** Encode a packed repeated varint field: each number is written as a varint and the pieces are joined */
function write_packed_varints(nums: number[]): Uint8Array {
	var pieces: Uint8Array[] = nums.map(function(value) { return write_varint49(value); });
	return u8concat(pieces);
}
//<<export { parse_varint49, write_varint49 };
/**
 * Interpret the start of `buf` as a varint and return it as a signed 32-bit integer.
 * At most five bytes are examined; bits beyond the 32nd are discarded by the shift.
 */
function varint_to_i32(buf: Uint8Array): number {
	var i32 = buf[0] & 0x7F;
	/* keep folding in 7-bit groups while the previous byte has its continuation bit set */
	for(var idx = 0, shift = 7; shift <= 28 && buf[idx] >= 0x80; shift += 7) {
		++idx;
		i32 |= (buf[idx] & 0x7F) << shift;
	}
	return i32;
}
//<<export { varint_to_i32 };
/** One value captured by the shallow Protobuf parser */
interface ProtoItem {
/** raw bytes of the value as sliced from the message */
data: Uint8Array;
/** wire type (low three bits of the field key) */
type: number;
}
/** Every item recorded for a single field number, in encounter order */
type ProtoField = Array<ProtoItem>
/** Sparse array of fields indexed by Protobuf field number */
type ProtoMessage = Array<ProtoField>;
2022-03-21 01:39:16 +00:00
/**
 * Shallow parse of a Protobuf message
 *
 * Splits `buf` into its top-level fields without interpreting them: the result
 * is indexed by field number and every entry keeps the raw bytes and wire type.
 * Wire type 0 keeps the undecoded varint bytes, 1 and 5 keep the 8 / 4 fixed
 * bytes, and 2 keeps the payload without its length prefix. Parsing stops at a
 * key whose field number is 0.
 *
 * Throws an Error for group wire types (3, 4) and any unknown wire type.
 */
function parse_shallow(buf: Uint8Array): ProtoMessage {
	var out: ProtoMessage = [], ptr: Ptr = [0];
	while(ptr[0] < buf.length) {
		var off = ptr[0];
		var num = parse_varint49(buf, ptr);
		var type = num & 0x07; num = Math.floor(num / 8);
		var len = 0;
		var res: Uint8Array;
		if(num == 0) break;
		switch(type) {
			case 0: {
				var l = ptr[0];
				/* skip over the varint: every byte but the last has the high bit set */
				while(buf[ptr[0]++] >= 0x80);
				res = buf[subarray](l, ptr[0]);
			} break;
			case 5: len = 4; res = buf[subarray](ptr[0], ptr[0] + len); ptr[0] += len; break;
			case 1: len = 8; res = buf[subarray](ptr[0], ptr[0] + len); ptr[0] += len; break;
			case 2: len = parse_varint49(buf, ptr); res = buf[subarray](ptr[0], ptr[0] + len); ptr[0] += len; break;
			case 3: // Start group
			case 4: // End group
			default: throw new Error(`PB Type ${type} for Field ${num} at offset ${off}`);
		}
		var v: ProtoItem = { data: res, type };
		if(out[num] == null) out[num] = [v];
		else out[num].push(v);
	}
	return out;
}
/**
 * Serialize a shallow parse
 *
 * Emits, for every item of every field, the key varint (field number * 8 +
 * wire type), a length prefix for wire type 2, and the raw data bytes. Field
 * index 0 and items without data are skipped.
 */
function write_shallow(proto: ProtoMessage): Uint8Array {
	var out: Uint8Array[] = [];
	proto.forEach((field, idx) => {
		if(idx == 0) return;
		field.forEach(item => {
			if(!item.data) return;
			out.push(write_varint49(idx * 8 + item.type));
			if(item.type == 2) out.push(write_varint49(item.data.length));
			out.push(item.data);
		});
	});
	return u8concat(out);
}
//<<export { parse_shallow, write_shallow };
2022-03-21 01:39:16 +00:00
/**
 * Map over each entry in a repeated (or single-value) field
 *
 * The callback receives the raw bytes of each item. A missing field
 * (null / undefined) yields an empty array.
 */
function mappa<U>(data: ProtoField, cb:(u8: Uint8Array) => U): U[] {
	return data?.map(d => cb(d.data)) || [];
}
/** One message stored in an IWA archive segment */
interface IWAMessage {
	/** Metadata in .TSP.MessageInfo */
	meta: ProtoMessage;
	/** raw message payload */
	data: Uint8Array;
}
/** One .TSP.ArchiveInfo segment together with the message payloads that follow it */
interface IWAArchiveInfo {
	/** archive identifier (field 1) */
	id: number;
	/** present when field 3 of the archive info was set; true when it is nonzero */
	merge?: boolean;
	/** messages in the order they appear in the segment */
	messages: IWAMessage[];
}
2022-03-21 01:39:16 +00:00
/**
 * Extract all messages from a IWA file
 *
 * The (already decompressed) buffer is a sequence of segments. Each segment is
 * a varint length, a .TSP.ArchiveInfo of that length, and then the payloads of
 * the messages it lists, back to back. Payload sizes come from field 3 of each
 * message info entry.
 */
function parse_iwa_file(buf: Uint8Array): IWAArchiveInfo[] {
	var out: IWAArchiveInfo[] = [], ptr: Ptr = [0];
	while(ptr[0] < buf.length) {
		/* .TSP.ArchiveInfo */
		var len = parse_varint49(buf, ptr);
		var ai = parse_shallow(buf[subarray](ptr[0], ptr[0] + len));
		ptr[0] += len;

		var res: IWAArchiveInfo = {
			/* TODO: technically ID is optional */
			id: varint_to_i32(ai[1][0].data),
			messages: []
		};
		ai[2].forEach(b => {
			var mi = parse_shallow(b.data);
			/* field 3 is the payload length; payloads follow the archive info in order */
			var fl = varint_to_i32(mi[3][0].data);
			res.messages.push({
				meta: mi,
				data: buf[subarray](ptr[0], ptr[0] + fl)
			});
			ptr[0] += fl;
		});
		if(ai[3]?.[0]) res.merge = (varint_to_i32(ai[3][0].data) >>> 0) > 0;
		out.push(res);
	}
	return out;
}
2022-04-11 04:11:47 +00:00
/**
 * Generate an IWA file from a parsed structure
 *
 * For every archive: a varint length, the serialized .TSP.ArchiveInfo, then
 * the message payloads in order. NOTE: field 3 (payload length) of each
 * message's `meta` is overwritten in place with the current data length.
 */
function write_iwa_file(ias: IWAArchiveInfo[]): Uint8Array {
	var bufs: Uint8Array[] = [];
	ias.forEach(ia => {
		var ai: ProtoMessage = [ [],
			[ {data: write_varint49(ia.id), type: 0} ],
			[]
		];
		if(ia.merge != null) ai[3] = [ { data: write_varint49(+!!ia.merge), type: 0 } ];

		var midata: Uint8Array[] = [];
		ia.messages.forEach(mi => {
			midata.push(mi.data);
			mi.meta[3] = [ { type: 0, data: write_varint49(mi.data.length) } ];
			ai[2].push({data: write_shallow(mi.meta), type: 2});
		});

		var aipayload = write_shallow(ai);
		bufs.push(write_varint49(aipayload.length));
		bufs.push(aipayload);
		midata.forEach(mid => bufs.push(mid));
	});
	return u8concat(bufs);
}
//<<export { IWAMessage, IWAArchiveInfo, parse_iwa_file, write_iwa_file };
2022-03-21 01:39:16 +00:00
/**
 * Decompress a snappy chunk
 *
 * `buf` starts with a varint holding the uncompressed size, followed by literal
 * elements (tag 0) and copy elements (tags 1..3). The output is returned as a
 * list of byte arrays whose concatenation is the decompressed data; copies are
 * expressed as views into earlier pieces instead of being materialized.
 *
 * Throws an Error when `type` is not 0, when a copy has offset 0 or reaches
 * before the start of the output, or when the produced length does not match
 * the size in the header.
 */
function parse_snappy_chunk(type: number, buf: Uint8Array): Uint8Array[] {
	if(type != 0) throw new Error(`Unexpected Snappy chunk type ${type}`);
	var ptr: Ptr = [0];

	var usz = parse_varint49(buf, ptr);
	var chunks: Uint8Array[] = [];
	while(ptr[0] < buf.length) {
		var tag = buf[ptr[0]] & 0x3;
		if(tag == 0) {
			/* literal: upper six bits are length-1, or 60..63 meaning 1..4 length bytes follow */
			var len = buf[ptr[0]++] >> 2;
			if(len < 60) ++len;
			else {
				var c = len - 59;
				len = buf[ptr[0]];
				if(c > 1) len |= (buf[ptr[0]+1]<<8);
				if(c > 2) len |= (buf[ptr[0]+2]<<16);
				if(c > 3) len |= (buf[ptr[0]+3]<<24);
				len >>>=0; len++;
				ptr[0] += c;
			}
			chunks.push(buf[subarray](ptr[0], ptr[0] + len)); ptr[0] += len; continue;
		} else {
			var offset = 0, length = 0;
			if(tag == 1) {
				/* 11-bit offset, length 4..11 */
				length = ((buf[ptr[0]] >> 2) & 0x7) + 4;
				offset = (buf[ptr[0]++] & 0xE0) << 3;
				offset |= buf[ptr[0]++];
			} else {
				length = (buf[ptr[0]++] >> 2) + 1;
				if(tag == 2) { offset = buf[ptr[0]] | (buf[ptr[0]+1]<<8); ptr[0] += 2; }
				else { offset = (buf[ptr[0]] | (buf[ptr[0]+1]<<8) | (buf[ptr[0]+2]<<16) | (buf[ptr[0]+3]<<24))>>>0; ptr[0] += 4; }
			}
			if(offset == 0) throw new Error("Invalid offset 0");
			/* walk backwards through the pieces to find the one containing the copy source */
			var j = chunks.length - 1, off = offset;
			while(j >=0 && off >= chunks[j].length) { off -= chunks[j].length; --j; }
			if(j < 0) {
				/* the source is exactly the start of the output */
				if(off == 0) off = chunks[(j = 0)].length;
				else throw new Error("Invalid offset beyond length");
			}
			// Node 0.8 Buffer slice does not support negative indices
			if(length < off) chunks.push(chunks[j][subarray](chunks[j].length-off, chunks[j].length-off + length));
			else {
				/* the copy spans pieces (possibly ones appended by this very copy, for overlapping runs) */
				if(off > 0) { chunks.push(chunks[j][subarray](chunks[j].length-off)); length -= off; } ++j;
				while(length >= chunks[j].length) { chunks.push(chunks[j]); length -= chunks[j].length; ++j; }
				if(length) chunks.push(chunks[j][subarray](0, length));
			}
			/* keep the backwards walk short */
			if(chunks.length > 100) chunks = [u8concat(chunks)];
		}
	}
	var total = chunks.reduce((acc, u8) => acc + u8.length, 0);
	if(total != usz) throw new Error(`Unexpected length: ${total} != ${usz}`);
	return chunks;
}
2022-03-21 01:39:16 +00:00
/**
 * Decompress IWA file
 *
 * The input is a sequence of frames: one type byte, a 3-byte little-endian
 * length, then that many bytes of snappy data. Plain arrays are accepted and
 * converted to Uint8Array first.
 *
 * Throws an Error if the frames do not end exactly at the end of the input.
 */
function decompress_iwa_file(buf: Uint8Array): Uint8Array {
	if(Array.isArray(buf)) buf = new Uint8Array(buf);
	var out: Uint8Array[] = [];
	var l = 0;
	while(l < buf.length) {
		var t = buf[l++];
		var len = buf[l] | (buf[l+1]<<8) | (buf[l+2] << 16); l += 3;
		out.push.apply(out, parse_snappy_chunk(t, buf[subarray](l, l + len)));
		l += len;
	}
	if(l !== buf.length) throw new Error("data is not a valid framed stream!");
	return u8concat(out);
}
2022-03-21 01:39:16 +00:00
/**
 * Compress IWA file
 *
 * No actual compression is attempted: every frame holds the varint size of the
 * chunk followed by a single snappy literal element containing the raw bytes.
 * Each frame is prefixed with a zero type byte and a 3-byte little-endian
 * length that counts the varint, the literal header and the payload.
 */
function compress_iwa_file(buf: Uint8Array): Uint8Array {
	var out: Uint8Array[] = [];
	var l = 0;
	while(l < buf.length) {
		/* the frame length field is only 24 bits wide and also covers up to 8 header
		   bytes (4 varint + 4 literal tag), so chunks must stay below 0xFFFFFF */
		var c = Math.min(buf.length - l, 0xFFFFF0);
		var frame = new Uint8Array(4);
		out.push(frame);
		var usz = write_varint49(c);
		var L = usz.length;
		out.push(usz);

		/* literal tag: lengths up to 60 fit in the tag byte, longer ones use 1..4 extra bytes of (length - 1) */
		if(c <= 60) { L++; out.push(new Uint8Array([(c - 1)<<2])); }
		else if(c <= 0x100)       { L += 2; out.push(new Uint8Array([0xF0, (c-1) & 0xFF])); }
		else if(c <= 0x10000)     { L += 3; out.push(new Uint8Array([0xF4, (c-1) & 0xFF, ((c-1) >> 8) & 0xFF])); }
		else if(c <= 0x1000000)   { L += 4; out.push(new Uint8Array([0xF8, (c-1) & 0xFF, ((c-1) >> 8) & 0xFF, ((c-1) >> 16) & 0xFF])); }
		else if(c <= 0x100000000) { L += 5; out.push(new Uint8Array([0xFC, (c-1) & 0xFF, ((c-1) >> 8) & 0xFF, ((c-1) >> 16) & 0xFF, ((c-1) >>> 24) & 0xFF])); }

		out.push(buf[subarray](l, l + c)); L += c;

		frame[0] = 0;
		frame[1] = L & 0xFF; frame[2] = (L >> 8) & 0xFF; frame[3] = (L >> 16) & 0xFF;
		l += c;
	}
	return u8concat(out);
}
//<<export { decompress_iwa_file, compress_iwa_file };
2022-09-04 21:51:49 +00:00
/** .TST.DataStore */
interface DataLUT {
/** shared string table */
sst: string[];
/** rich string table */
rsst: string[];
/** old format table */
ofmt: ProtoMessage[];
/** new format table */
nfmt: ProtoMessage[];
}
/** Create a lookup table set with every table empty */
var numbers_lut_new = (): DataLUT => ({ sst: [], rsst: [], ofmt: [], nfmt: [] });
/**
 * Apply a Numbers cell format to a parsed cell (currently durations only)
 *
 * `t` packs the cell type in the low byte and the storage version above it;
 * versions >= 5 use `nfmt`, older ones `ofmt`. Nothing happens unless the
 * duration bit is set in `flags` (8 for version 5+, 4 otherwise), the cell is
 * numeric and the cell type is 7.
 *
 * The format message supplies the style (field 7: 0 = colon separated,
 * 1 = short unit suffixes, 2 = spelled-out units), the largest and smallest
 * units to show (fields 15 / 16) and an automatic-units flag (field 40). Units
 * are coded 1 = weeks, 2 = days, 4 = hours, 8 = minutes, 16 = seconds,
 * 32 = milliseconds. At this point `cell.v` is expected to be in seconds.
 *
 * On success `cell.w` receives the formatted text and `cell.z` a number format
 * string; `cell.v` is not modified.
 */
function numbers_format_cell(cell: CellObject, t: number, flags: number, ofmt: ProtoMessage, nfmt: ProtoMessage): void {
	var ctype = t & 0xFF, ver = t >> 8;
	var fmt = ver >= 5 ? nfmt : ofmt;
	dur: if((flags & (ver > 4 ? 8: 4)) && cell.t == "n" && ctype == 7) {
		var dstyle = (fmt[7]?.[0])  ? parse_varint49(fmt[7][0].data)  : -1;
		if(dstyle == -1) break dur;
		var dmin   = (fmt[15]?.[0]) ? parse_varint49(fmt[15][0].data) : -1;
		var dmax   = (fmt[16]?.[0]) ? parse_varint49(fmt[16][0].data) : -1;
		var auto   = (fmt[40]?.[0]) ? parse_varint49(fmt[40][0].data) : -1;
		var d: number = cell.v as number, dd = d;
		autodur: if(auto) { // TODO: check if numbers reformats on load
			if(d == 0) { dmin = dmax = 2; break autodur; }
			/* largest unit: the biggest one that the value reaches */
			if(d >= 604800) dmin = 1;
			else if(d >= 86400) dmin = 2;
			else if(d >= 3600) dmin = 4;
			else if(d >= 60) dmin = 8;
			else if(d >= 1) dmin = 16;
			else dmin = 32;
			/* smallest unit: the finest one with a nonzero remainder */
			if(Math.floor(d) != d) dmax = 32;
			else if(d % 60) dmax = 16;
			else if(d % 3600) dmax = 8;
			else if(d % 86400) dmax = 4;
			else if(d % 604800) dmax = 2;
			if(dmax < dmin) dmax = dmin;
		}

		if(dmin == -1 || dmax == -1) break dur;

		var dstr: string[] = [], zstr: string[] = [];

		/* TODO: plurality, SSF equivalents */
		if(dmin == 1) {
			dd = d / 604800;
			if(dmax == 1) { zstr.push('d"d"'); } else { dd |= 0; d -= 604800 * dd; }
			dstr.push(dd + (dstyle == 2 ? " week" + (dd == 1 ? "" : "s") : dstyle == 1 ? "w": ""));
		}

		if(dmin <= 2 && dmax >= 2) {
			dd = d / 86400;
			if(dmax > 2) { dd |= 0; d -= 86400 * dd; }
			zstr.push("d" + '"d"');
			dstr.push(dd + (dstyle == 2 ? " day" + (dd == 1 ? "" : "s") : dstyle == 1 ? "d" : ""));
		}

		if(dmin <= 4 && dmax >= 4) {
			dd = d / 3600;
			if(dmax > 4) { dd |= 0; d -= 3600 * dd; }
			zstr.push((dmin >= 4 ? "[h]" : "h") + '"h"');
			dstr.push(dd + (dstyle == 2 ? " hour" + (dd == 1 ? "" : "s") : dstyle == 1 ? "h" : ""));
		}

		if(dmin <= 8 && dmax >= 8) {
			dd = d / 60;
			if(dmax > 8) { dd |= 0; d -= 60 * dd; }
			zstr.push((dmin >= 8 ? "[m]" : "m") + '"m"');
			if(dstyle == 0) dstr.push(((dmin == 8 && dmax == 8 || dd >= 10) ? "" : "0") + dd);
			else dstr.push(dd + (dstyle == 2 ? " minute" + (dd == 1 ? "" : "s") : dstyle == 1 ? "m" : ""));
		}

		if(dmin <= 16 && dmax >= 16) {
			dd = d;
			if(dmax > 16) { dd |= 0; d -= dd; }
			zstr.push((dmin >= 16 ? "[s]" : "s") + '"s"');
			if(dstyle == 0) dstr.push((dmax == 16 && dmin == 16 || dd >= 10 ? "" : "0") + dd);
			else dstr.push(dd + (dstyle == 2 ? " second" + (dd == 1 ? "" : "s") : dstyle == 1 ? "s" : ""));
		}

		if(dmax >= 32) {
			dd = Math.round(1000 * d);
			if(dmin < 32) zstr.push(".000" + '"ms"');
			if(dstyle == 0) dstr.push((dd >= 100 ? "" : dd >= 10 ? "0" : "00") + dd);
			else dstr.push(dd + (dstyle == 2 ? " millisecond" + (dd == 1 ? "" : "s") : dstyle == 1 ? "ms" : ""));
		}
		cell.w = dstr.join(dstyle == 0 ? ":" : " "); cell.z = zstr.join(dstyle == 0 ? '":"': " ");
		/* colon style shows milliseconds as a decimal fraction of the seconds */
		if(dstyle == 0) cell.w = cell.w.replace(/:(\d\d\d)$/, ".$1");
	}
}
/**
 * Parse "old storage" (version 0..4)
 *
 * Header as read here: byte 0 is the version (passed in as `v`), the cell type
 * is byte 1 for version 4 and byte 2 before that, and a 32-bit flag word at
 * offset 4 says which optional fields follow. Fields start at offset 12
 * (offset 8 for versions 0 and 1) and appear in flag order; fields this parser
 * does not use are skipped 4 bytes at a time.
 *
 * Returns undefined for blank cells (type 0). Date-times are stored as seconds
 * relative to `new Date(2001, 0, 1)`. Durations are read in seconds and
 * converted to days after formatting.
 *
 * Throws an Error for unsupported cell types and for rich text cells that
 * carry no rich string index.
 */
function parse_old_storage(buf: Uint8Array, lut: DataLUT, v: 0|1|2|3|4): CellObject | void {
	var dv = u8_to_dataview(buf);
	var flags = dv.getUint32(4, true);

	var ridx = -1, sidx = -1, zidx = -1, ieee = NaN, dt = new Date(2001, 0, 1);
	var doff = (v > 1 ? 12 : 8);
	if(flags & 0x0002) { zidx = dv.getUint32(doff, true); doff += 4;}
	doff += popcnt(flags & (v > 1 ? 0x0D8C : 0x018C)) * 4;
	if(flags & 0x0200) { ridx = dv.getUint32(doff,  true); doff += 4; }
	doff += popcnt(flags & (v > 1 ? 0x3000 : 0x1000)) * 4;
	if(flags & 0x0010) { sidx = dv.getUint32(doff,  true); doff += 4; }
	if(flags & 0x0020) { ieee = dv.getFloat64(doff, true); doff += 8; }
	if(flags & 0x0040) { dt.setTime(dt.getTime() +  dv.getFloat64(doff, true) * 1000); doff += 8; }

	if(v > 1) {
		/* from here on `flags` holds the upper half of the word at offset 8 */
		flags = dv.getUint32(8, true) >>> 16;
		/* TODO: stress test if a cell can have multiple sub-type formats */
		if(flags & 0xFF) { if(zidx == -1) zidx = dv.getUint32(doff, true); doff += 4; }
	}

	var ret: CellObject;
	var t = buf[v >= 4 ? 1 : 2];
	switch(t) {
		case 0: return void 0; // return { t: "z" }; // blank?
		case 2: ret = { t: "n", v: ieee }; break; // number
		case 3: ret = { t: "s", v: lut.sst[sidx] }; break; // string
		case 5: ret = { t: "d", v: dt }; break; // date-time
		case 6: ret = { t: "b", v: ieee > 0 }; break; // boolean
		case 7: ret = { t: "n", v: ieee }; break; // duration in seconds
		case 8: ret = { t: "e", v: 0}; break; // "formula error" TODO: enumerate and map errors to csf equivalents
		case 9: { // "rich text"
			if(ridx > -1) ret = { t: "s", v: lut.rsst[ridx] };
			else throw new Error(`Unsupported cell type ${buf[subarray](0,4)}`);
		} break;
		default: throw new Error(`Unsupported cell type ${buf[subarray](0,4)}`);
	}

	if(zidx > -1) numbers_format_cell(ret, t | (v<<8), flags, lut.ofmt[zidx], lut.nfmt[zidx]);
	/* formatting works on seconds; the stored value is in days */
	if(t == 7) (ret.v as number) /= 86400;
	return ret;
}
/**
 * Parse "new storage" (version 5)
 *
 * Header as read here: byte 1 is the cell type and the 32-bit word at offset 8
 * is a field mask. Data fields start at offset 12 in mask order: 128-bit
 * decimal (0x01), double (0x02), date as seconds relative to
 * `new Date(2001, 0, 1)` (0x04), shared string index (0x08) and rich string
 * index (0x10). Styling / formula fields are skipped, then a format index is
 * read if any of the 0x07E000 bits is set.
 *
 * Returns undefined for blank cells (type 0) and throws an Error for unknown
 * cell types. Durations are read in seconds and converted to days after
 * formatting.
 */
function parse_new_storage(buf: Uint8Array, lut: DataLUT): CellObject | void {
	var dv = u8_to_dataview(buf);
	// TODO: bytes 2:3 appear to be unused?
	var flags = dv.getUint32(4, true);
	var fields = dv.getUint32(8, true);
	var doff = 12;

	var ridx = -1, sidx = -1, zidx = -1, d128 = NaN, ieee = NaN, dt = new Date(2001, 0, 1);

	// 0x00001F data
	if(fields & 0x000001) { d128 = readDecimal128LE(buf, doff); doff += 16; }
	if(fields & 0x000002) { ieee = dv.getFloat64(doff, true); doff += 8; }
	if(fields & 0x000004) { dt.setTime(dt.getTime() +  dv.getFloat64(doff, true) * 1000); doff += 8; }
	if(fields & 0x000008) { sidx = dv.getUint32(doff,  true); doff += 4; }
	if(fields & 0x000010) { ridx = dv.getUint32(doff,  true); doff += 4; }

	var ret: CellObject;
	var t = buf[1];
	switch(t) {
		case  0: return void 0; // return { t: "z" }; // blank?
		case  2: ret = { t: "n", v: d128 }; break; // number
		case  3: ret = { t: "s", v: lut.sst[sidx] }; break; // string
		case  5: ret = { t: "d", v: dt }; break; // date-time
		case  6: ret = { t: "b", v: ieee > 0 }; break; // boolean
		case  7: ret = { t: "n", v: ieee }; break;  // duration in "s", fixed later
		case  8: ret = { t: "e", v: 0 }; break; // "formula error" TODO: enumerate and map errors to csf equivalents
		case  9: ret = { t: "s", v: lut.rsst[ridx] }; break;// "rich text"
		case 10: ret = { t: "n", v: d128 }; break; // currency
		default: throw new Error(`Unsupported cell type ${buf[1]} : ${fields & 0x1F} : ${buf[subarray](0,4)}`);
	}

	// 0x0001E0 styling
	// 0x000E00 formula
	// 0x001000 something related to cell format
	doff += popcnt(fields & 0x001FE0) * 4;

	/* TODO: stress test if a cell can have multiple sub-type formats */
	// 0x07E000 formats
	if(fields & 0x07E000) { if(zidx == -1) zidx = dv.getUint32(doff, true); doff += 4; }

	// 0x080000 comment
	// 0x100000 warning
	if(zidx > -1) numbers_format_cell(ret, t | (5<<8), fields >> 13, lut.ofmt[zidx], lut.nfmt[zidx] );
	if(t == 7) (ret.v as number) /= 86400; // duration -> SheetJS absolute time
	return ret;
}
2022-04-11 04:11:47 +00:00
/**
 * Write a cell "new storage" (version 5)
 *
 * Byte 0 is the version, byte 1 the cell type, the word at offset 8 the field
 * mask and the value starts at offset 12: numbers as a 128-bit decimal,
 * booleans as a double (1 / 0), strings as their index in `sst`.
 *
 * Throws an Error when a string is not in `sst`, and throws a string for any
 * cell type other than "n", "b" or "s".
 */
function write_new_storage(cell: CellObject, sst: string[]): Uint8Array {
	var out = new Uint8Array(32), dv = u8_to_dataview(out), l = 12, flags = 0;
	out[0] = 5;
	switch(cell.t) {
		case "n": out[1] = 2; writeDecimal128LE(out, l, cell.v as number); flags |= 1; l += 16; break;
		case "b": out[1] = 6; dv.setFloat64(l, cell.v ? 1 : 0, true); flags |= 2; l += 8; break;
		case "s":
			if(sst.indexOf(cell.v as string) == -1) throw new Error(`Value ${cell.v} missing from SST!`);
			out[1] = 3; dv.setUint32(l, sst.indexOf(cell.v as string), true); flags |= 8; l += 4; break;
		default: throw "unsupported cell type " + cell.t;
	}
	dv.setUint32(8, flags, true);
	return out[subarray](0, l);
}
/**
 * Write a cell "old storage" (version 4)
 *
 * The layout mirrors what parse_old_storage reads for version 4: byte 0 is the
 * version, byte 1 the cell type, the word at offset 4 the field flags and the
 * value starts at offset 12 (numbers and booleans as a double under flag 0x20,
 * strings as their index in `sst` under flag 0x10).
 *
 * Throws an Error when a string is not in `sst`, and throws a string for any
 * cell type other than "n", "b" or "s".
 */
function write_old_storage(cell: CellObject, sst: string[]): Uint8Array {
	var out = new Uint8Array(32), dv = u8_to_dataview(out), l = 12, flags = 0;
	out[0] = 4;
	switch(cell.t) {
		/* version 4 keeps the cell type in byte 1 (byte 2 was used by versions < 4) */
		case "n": out[1] = 2; dv.setFloat64(l, cell.v as number, true); flags |= 0x20; l += 8; break;
		case "b": out[1] = 6; dv.setFloat64(l, cell.v ? 1 : 0, true); flags |= 0x20; l += 8; break;
		case "s":
			if(sst.indexOf(cell.v as string) == -1) throw new Error(`Value ${cell.v} missing from SST!`);
			out[1] = 3; dv.setUint32(l, sst.indexOf(cell.v as string), true); flags |= 0x10; l += 4; break;
		default: throw "unsupported cell type " + cell.t;
	}
	/* the old-storage reader takes its field flags from offset 4 */
	dv.setUint32(4, flags, true);
	return out[subarray](0, l);
}
//<<export { write_new_storage, write_old_storage };
2022-09-04 21:51:49 +00:00
/**
 * Parse one cell record, dispatching on the storage version in byte 0:
 * versions 0..4 go to the old-storage parser, version 5 to the new one.
 * Throws an Error for any other version.
 */
function parse_cell_storage(buf: Uint8Array, lut: DataLUT): CellObject | void {
	switch(buf[0]) {
		case 0: case 1:
		case 2: case 3: case 4: return parse_old_storage(buf, lut, buf[0]);
		case 5: return parse_new_storage(buf, lut);
		default: throw new Error(`Unsupported payload version ${buf[0]}`);
	}
}
2022-03-21 01:39:16 +00:00
/** .TSS.StylesheetArchive */
//function parse_TSS_StylesheetArchive(M: IWAMessage[][], root: IWAMessage): void {
// var pb = parse_shallow(root.data);
//}
2022-04-11 04:11:47 +00:00
/** Parse .TSP.Reference: decode the varint held in the first item of field 1 */
function parse_TSP_Reference(buf: Uint8Array): number {
	var identifier = parse_shallow(buf)[1][0];
	return parse_varint49(identifier.data);
}
2022-04-11 04:11:47 +00:00
/** Write .TSP.Reference: a message whose field 1 holds `idx` as a varint */
function write_TSP_Reference(idx: number): Uint8Array {
	return write_shallow([
		[],
		[ { type: 0, data: write_varint49(idx) } ]
	]);
}
//<<export { parse_TSP_Reference, write_TSP_Reference };
2022-03-21 01:39:16 +00:00
/** Lookup from a numeric id (as returned by parse_TSP_Reference) to the list of messages stored under that id */
type MessageSpace = {[id: number]: IWAMessage[]};
2022-04-11 04:11:47 +00:00
/**
 * Parse .TST.TableDataList
 *
 * Returns a sparse array indexed by the key of each list entry. The element
 * type depends on the list type in field 1:
 *  - 1: strings decoded from field 3 of the entry
 *  - 2: shallow-parsed format messages from field 6 of the entry
 *  - 8: rich text flattened to a plain string by following the references to
 *       the .TSWP.StorageArchive and joining its text runs
 *
 * Throws an Error when a rich text reference resolves to a message whose type
 * is not 2001, and throws the raw list type (a number) for any other list type.
 */
function parse_TST_TableDataList(M: MessageSpace, root: IWAMessage): any[] {
	var pb = parse_shallow(root.data);
	// .TST.TableDataList.ListType
	var type = varint_to_i32(pb[1][0].data);

	var entries = pb[3];
	var data: any[] = [];
	(entries||[]).forEach(entry => {
		// .TST.TableDataList.ListEntry
		var le = parse_shallow(entry.data);
		var key = varint_to_i32(le[1][0].data)>>>0;
		switch(type) {
			case 1: data[key] = u8str(le[3][0].data); break;
			case 8: {
				// .TSP.RichTextPayloadArchive
				var rt = M[parse_TSP_Reference(le[9][0].data)][0];
				var rtp = parse_shallow(rt.data);

				// .TSWP.StorageArchive
				var rtpref = M[parse_TSP_Reference(rtp[1][0].data)][0];
				var mtype = varint_to_i32(rtpref.meta[1][0].data);
				if(mtype != 2001) throw new Error(`2000 unexpected reference to ${mtype}`);
				var tswpsa = parse_shallow(rtpref.data);

				data[key] = tswpsa[3].map(x => u8str(x.data)).join("");
			} break;
			case 2: data[key] = parse_shallow(le[6][0].data); break;
			default: throw type;
		}
	});
	return data;
}
2022-03-21 01:39:16 +00:00
/** Which cell storage to read from a tile row: 1 = modern, 0 = old, -1 = try modern first, then old */
type TileStorageType = -1 | 0 | 1;
/** Cells of one row of a tile */
interface TileRowInfo {
	/** Row Index */
	R: number;
	/** Cell Storage */
	cells: Uint8Array[];
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TST.TileRowInfo
 *
 * Field 1 is the row index and field 2 the number of cells. Cell records live
 * in one storage blob with a table of 16-bit little-endian offsets, one per
 * column (0xFFFF = no cell): fields 6 / 7 for modern storage, fields 3 / 4 for
 * old storage. When field 8 is set the offsets are in units of 4 bytes. Each
 * cell runs from its offset to the next present cell's offset (the last one to
 * the end of the blob).
 *
 * Returns the row index and a sparse array of raw cell records by column.
 * Throws a string when the requested storage is missing or when the number of
 * offsets found differs from the declared cell count.
 */
function parse_TST_TileRowInfo(u8: Uint8Array, type: TileStorageType): TileRowInfo {
	var pb = parse_shallow(u8);
	var R = varint_to_i32(pb[1][0].data) >>> 0;
	var cnt = varint_to_i32(pb[2][0].data) >>> 0;
	// var version = pb?.[5]?.[0] && (varint_to_i32(pb[5][0].data) >>> 0);
	var wide_offsets = pb[8]?.[0]?.data && varint_to_i32(pb[8][0].data) > 0 || false;

	/* select storage by type (1 = modern / 0 = old / -1 = try modern, old) */
	var used_storage_u8: Uint8Array, used_storage: Uint8Array;
	if(pb[7]?.[0]?.data && type != 0) { used_storage_u8 = pb[7]?.[0]?.data; used_storage = pb[6]?.[0]?.data; }
	else if(pb[4]?.[0]?.data && type != 1) { used_storage_u8 = pb[4]?.[0]?.data; used_storage = pb[3]?.[0]?.data; }
	else throw `NUMBERS Tile missing ${type} cell storage`;

	/* find all offsets -- 0xFFFF means cells are not present */
	var width = wide_offsets ? 4 : 1;
	var used_storage_offsets = u8_to_dataview(used_storage_u8);
	var offsets: Array<[number, number]> = [];
	for(var C = 0; C < used_storage_u8.length / 2; ++C) {
		var off = used_storage_offsets.getUint16(C*2, true);
		if(off < 65535) offsets.push([C, off]);
	}
	if(offsets.length != cnt) throw `Expected ${cnt} cells, found ${offsets.length}`;

	var cells: Uint8Array[] = [];
	for(C = 0; C < offsets.length - 1; ++C) cells[offsets[C][0]] = used_storage[subarray](offsets[C][1] * width, offsets[C+1][1] * width);
	if(offsets.length >= 1) cells[offsets[offsets.length - 1][0]] = used_storage[subarray](offsets[offsets.length - 1][1] * width);
	return { R, cells };
}
2022-03-21 01:39:16 +00:00
/** Parsed tile: raw cell records plus the row count reported by the tile */
interface TileInfo {
/** raw cell records indexed by row, then column (both sparse) */
data: Uint8Array[][];
/** value of field 4 of the tile message; used by the caller to advance the row offset */
nrows: number;
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TST.Tile
 *
 * Field 7, when present, selects modern (nonzero) or old (zero) cell storage;
 * when absent each row tries modern storage first. Rows come from field 5 and
 * are merged into a sparse row-by-column grid of raw cell records.
 *
 * Throws an Error when two row records provide the same cell.
 */
function parse_TST_Tile(M: MessageSpace, root: IWAMessage): TileInfo {
	var pb = parse_shallow(root.data);
	// ESBuild issue 2136
	// var storage: TileStorageType = (pb?.[7]?.[0]) ? ((varint_to_i32(pb[7][0].data)>>>0) > 0 ? 1 : 0 ) : -1;
	var storage: TileStorageType = -1;
	if(pb?.[7]?.[0]) { if(varint_to_i32(pb[7][0].data)>>>0) storage = 1; else storage = 0; }
	var ri = mappa(pb[5], (u8: Uint8Array) => parse_TST_TileRowInfo(u8, storage));
	return {
		nrows: varint_to_i32(pb[4][0].data)>>>0,
		data: ri.reduce((acc, x) => {
			if(!acc[x.R]) acc[x.R] = [];
			x.cells.forEach((cell, C) => {
				if(acc[x.R][C]) throw new Error(`Duplicate cell r=${x.R} c=${C}`);
				acc[x.R][C] = cell;
			});
			return acc;
		}, [] as Uint8Array[][])
	};
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TST.TableModelArchive (6001)
 *
 * Fills `ws` in place: "!ref" from the row / column counts in fields 6 and 7,
 * one cell per record found in the tiles referenced by the data store, and
 * "!merges" when the data store references a merge list. `ws` may be a dense
 * (array) or sparse (address-keyed) worksheet. Tiles are stacked vertically in
 * list order, each one offset by the row counts of the tiles before it.
 *
 * Throws an Error for zero row / column counts and for references that
 * resolve to an unexpected message type.
 */
function parse_TST_TableModelArchive(M: MessageSpace, root: IWAMessage, ws: WorkSheet) {
	var pb = parse_shallow(root.data);
	var range: Range = { s: {r:0, c:0}, e: {r:0, c:0} };
	range.e.r = (varint_to_i32(pb[6][0].data) >>> 0) - 1;
	if(range.e.r < 0) throw new Error(`Invalid row varint ${pb[6][0].data}`);
	range.e.c = (varint_to_i32(pb[7][0].data) >>> 0) - 1;
	if(range.e.c < 0) throw new Error(`Invalid col varint ${pb[7][0].data}`);
	ws["!ref"] = encode_range(range);
	var dense = Array.isArray(ws);

	// .TST.DataStore
	var store = parse_shallow(pb[4][0].data);
	var lut: DataLUT = numbers_lut_new();
	if(store[4]?.[0]) lut.sst = parse_TST_TableDataList(M, M[parse_TSP_Reference(store[4][0].data)][0]);
	if(store[11]?.[0]) lut.ofmt = parse_TST_TableDataList(M, M[parse_TSP_Reference(store[11][0].data)][0]);
	if(store[17]?.[0]) lut.rsst = parse_TST_TableDataList(M, M[parse_TSP_Reference(store[17][0].data)][0]);
	if(store[22]?.[0]) lut.nfmt = parse_TST_TableDataList(M, M[parse_TSP_Reference(store[22][0].data)][0]);

	// .TST.TileStorage
	var tile = parse_shallow(store[3][0].data);
	var _R = 0;
	/* TODO: should this list be sorted by id ? */
	tile[1].forEach(t => {
		var tl = (parse_shallow(t.data));
		// var id = varint_to_i32(tl[1][0].data);
		var ref = M[parse_TSP_Reference(tl[2][0].data)][0];
		var mtype = varint_to_i32(ref.meta[1][0].data);
		if(mtype != 6002) throw new Error(`6001 unexpected reference to ${mtype}`);
		var _tile = parse_TST_Tile(M, ref);
		_tile.data.forEach((row, R) => {
			row.forEach((buf, C) => {
				var res = parse_cell_storage(buf, lut);
				if(res) {
					if(dense) {
						if(!ws[_R + R]) ws[_R + R] = [];
						ws[_R + R][C] = res;
					} else {
						var addr = encode_cell({r:_R + R,c:C});
						ws[addr] = res;
					}
				}
			});
		});
		_R += _tile.nrows;
	});

	if(store[13]?.[0]) {
		var ref = M[parse_TSP_Reference(store[13][0].data)][0];
		var mtype = varint_to_i32(ref.meta[1][0].data);
		if(mtype != 6144) throw new Error(`Expected merge type 6144, found ${mtype}`);
		/* a merge list without entries has no field 1; treat it as an empty list instead of crashing */
		var merge_entries = parse_shallow(ref.data)[1] || [];
		ws["!merges"] = merge_entries.map(pi => {
			var merge = parse_shallow(pi.data);
			/* origin and size are each two 16-bit little-endian values: row then column */
			var origin = u8_to_dataview(parse_shallow(merge[1][0].data)[1][0].data), size = u8_to_dataview(parse_shallow(merge[2][0].data)[1][0].data);
			return {
				s: { r: origin.getUint16(0, true), c: origin.getUint16(2, true) },
				e: {
					r: origin.getUint16(0, true) + size.getUint16(0, true) - 1,
					c: origin.getUint16(2, true) + size.getUint16(2, true) - 1
				}
			};
		});
	}
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TST.TableInfoArchive (6000)
 *
 * Creates a worksheet (an array when `opts.dense` is set, a plain object
 * otherwise) and fills it from the table model referenced by field 2.
 *
 * Throws an Error when the reference does not resolve to a 6001 message.
 */
function parse_TST_TableInfoArchive(M: MessageSpace, root: IWAMessage, opts?: ParsingOptions): WorkSheet {
	var pb = parse_shallow(root.data);
	// ESBuild #2375
	var out: WorkSheet;
	if(!opts?.dense) out = ({ "!ref": "A1" });
	else out = ([] as any);
	out["!ref"] = "A1";
	var tableref = M[parse_TSP_Reference(pb[2][0].data)];
	var mtype = varint_to_i32(tableref[0].meta[1][0].data);
	if(mtype != 6001) throw new Error(`6000 unexpected reference to ${mtype}`);
	parse_TST_TableModelArchive(M, tableref[0], out);
	return out;
}
/** Result of parsing one .TN.SheetArchive: the sheet name plus every table found on it */
interface NSheet {
/** sheet name; empty string when the archive carries no name field */
name: string;
/** one worksheet for each type-6000 message reachable from the sheet */
sheets: WorkSheet[];
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TN.SheetArchive (2)
 *
 * Reads the sheet name from field 1 and walks the references in field 2,
 * parsing every referenced message of type 6000 as a table.
 *
 * @param M    message space (archive id -> messages)
 * @param root the SheetArchive message
 * @param opts parsing options forwarded to the table parser
 * @returns the sheet name and the parsed worksheets
 */
function parse_TN_SheetArchive(M: MessageSpace, root: IWAMessage, opts?: ParsingOptions): NSheet {
	var pb = parse_shallow(root.data);
	var out: NSheet = {
		name: (pb[1]?.[0] ? u8str(pb[1][0].data) : ""),
		sheets: []
	};
	var shapeoffs = mappa(pb[2], parse_TSP_Reference);
	shapeoffs.forEach((off) => {
		M[off].forEach((m: IWAMessage) => {
			var mtype = varint_to_i32(m.meta[1][0].data);
			/* messages of any other type are ignored */
			if(mtype == 6000) out.sheets.push(parse_TST_TableInfoArchive(M, m, opts));
		});
	});
	return out;
}
2022-04-11 04:11:47 +00:00
/**
 * Parse .TN.DocumentArchive
 *
 * Walks the sheet references in field 1 and appends every parsed table to a
 * new workbook. The first table of a sheet takes the sheet name; later tables
 * are named `<sheet name>_<index>`.
 *
 * @param M    message space (archive id -> messages)
 * @param root the document root message
 * @param opts parsing options forwarded to the sheet parser
 * @returns workbook with `bookType` set to "numbers"
 * @throws Error when field 2 is present (reported as a Keynote presentation)
 *         or when no worksheet was produced
 */
function parse_TN_DocumentArchive(M: MessageSpace, root: IWAMessage, opts?: ParsingOptions): WorkBook {
	var out = book_new();
	var pb = parse_shallow(root.data);
	if(pb[2]?.[0]) throw new Error("Keynote presentations are not supported");

	// var stylesheet = mappa(pb[4], parse_TSP_Reference)[0];
	// if(varint_to_i32(M[stylesheet][0].meta[1][0].data) == 401) parse_TSS_StylesheetArchive(M, M[stylesheet][0]);
	// var sidebar = mappa(pb[5], parse_TSP_Reference);
	// var theme = mappa(pb[6], parse_TSP_Reference);
	// var docinfo = parse_shallow(pb[8][0].data);
	// var tskinfo = parse_shallow(docinfo[1][0].data);
	// var author_storage = mappa(tskinfo[7], parse_TSP_Reference);
	var sheetoffs = mappa(pb[1], parse_TSP_Reference);
	sheetoffs.forEach((off) => {
		M[off].forEach((m: IWAMessage) => {
			var mtype = varint_to_i32(m.meta[1][0].data);
			if(mtype == 2) {
				var nsheet = parse_TN_SheetArchive(M, m, opts);
				/* the trailing `true` asks book_append_sheet to pick a new name on collision */
				nsheet.sheets.forEach((sheet, idx) => { book_append_sheet(out, sheet, idx == 0 ? nsheet.name : nsheet.name + "_" + idx, true); });
			}
		});
	});
	if(out.SheetNames.length == 0) throw new Error("Empty NUMBERS file");
	out.bookType = "numbers";
	return out;
}
2022-03-21 01:39:16 +00:00
/**
 * Parse NUMBERS file
 *
 * Decompresses and parses every `.iwa` entry of the container into one
 * message space, locates the document root (message type 1) and parses it.
 * Entries that fail to decompress or parse are logged and skipped.
 *
 * @param cfb  container holding the files of the NUMBERS archive
 * @param opts parsing options forwarded to the document parser
 * @returns the parsed workbook
 * @throws Error for password-protected files (a path matching `.iwpv2`),
 *         files without messages, Pages documents (root type 10000),
 *         multiple document roots, or a missing document root
 */
function parse_numbers_iwa(cfb: CFB$Container, opts?: ParsingOptions ): WorkBook {
	var M: MessageSpace = {}, indices: number[] = [];
	cfb.FullPaths.forEach(p => { if(p.match(/\.iwpv2/)) throw new Error(`Unsupported password protection`); });

	/* collect entire message space */
	cfb.FileIndex.forEach(s => {
		if(!s.name.match(/\.iwa$/)) return;
		if(s.content[0] == 98) return; // TODO: OperationStorage.iwa
		var o: Uint8Array;
		try { o = decompress_iwa_file(s.content as Uint8Array); } catch(e) { return console.log("?? " + s.content.length + " " + (e.message || e)); }
		var packets: IWAArchiveInfo[];
		try { packets = parse_iwa_file(o); } catch(e) { return console.log("## " + (e.message || e)); }
		packets.forEach(packet => { M[packet.id] = packet.messages; indices.push(packet.id); });
	});
	if(!indices.length) throw new Error("File has no messages");

	/* find document root */
	if(M?.[1]?.[0]?.meta?.[1]?.[0].data && varint_to_i32(M[1][0].meta[1][0].data) == 10000) throw new Error("Pages documents are not supported");
	/* fast path: archive 1 holds a type-1 message */
	var docroot: IWAMessage | false = M?.[1]?.[0]?.meta?.[1]?.[0].data && varint_to_i32(M[1][0].meta[1][0].data) == 1 && M[1][0];
	/* slow path: scan every message for type 1 and insist on exactly one */
	if(!docroot) indices.forEach((idx) => {
		M[idx].forEach((iwam) => {
			var mtype = varint_to_i32(iwam.meta[1][0].data) >>> 0;
			if(mtype == 1) {
				if(!docroot) docroot = iwam;
				else throw new Error("Document has multiple roots");
			}
		});
	});
	if(!docroot) throw new Error("Cannot find Document root");
	return parse_TN_DocumentArchive(M, docroot, opts);
}
2022-03-21 01:39:16 +00:00
//<<export { parse_numbers_iwa };
/** Bookkeeping record for one archive in the NUMBERS template */
interface DependentInfo {
	/** ids of archives that appear to reference this archive */
	deps: number[];
	/** full container path of the `.iwa` file that holds the archive */
	location: string;
	/** message type of the archive */
	type: number;
}
2022-04-11 04:11:47 +00:00
/**
 * Write .TST.TileRowInfo
 *
 * Regenerates the cell storage of one tile row in place. Two parallel
 * encodings are written: the new-style storage (cells in field 6, 16-bit
 * offsets in field 7) and the old-style storage (cells in field 3, offsets
 * in field 4). Blank cells get the offset 0xFFFF.
 *
 * @param tri  shallow-parsed TileRowInfo message; mutated in place
 * @param data row values (string, number or boolean); `null` / `undefined` marks a blank cell
 * @param SST  shared string table handed to the cell storage writers
 * @param wide when true, stored offsets are divided by 4 and field 8 is set to 1
 * @returns number of non-blank cells written
 * @throws a string when field 6 or 7 is missing; Error for unsupported value types
 */
function write_tile_row(tri: ProtoMessage, data: any[], SST: string[], wide: boolean): number {
	if(!tri[6]?.[0] || !tri[7]?.[0]) throw "Mutation only works on post-BNC storages!";
	//var wide_offsets = tri[8]?.[0]?.data && varint_to_i32(tri[8][0].data) > 0 || false;
	var cnt = 0;
	/* grow the offset tables so every column has a 2-byte slot */
	if(tri[7][0].data.length < 2 * data.length) {
		var new_7 = new Uint8Array(2 * data.length);
		new_7.set(tri[7][0].data);
		tri[7][0].data = new_7;
	}
	//if(wide) {
	//	tri[3] = [{type: 2, data: new Uint8Array([240, 159, 164, 160]) }];
	//	tri[4] = [{type: 2, data: new Uint8Array([240, 159, 164, 160]) }];
	/* } else*/ if(tri[4][0].data.length < 2 * data.length) {
		var new_4 = new Uint8Array(2 * data.length);
		new_4.set(tri[4][0].data);
		tri[4][0].data = new_4;
	}
	var dv = u8_to_dataview(tri[7][0].data), last_offset = 0, cell_storage: Uint8Array[] = [];
	var _dv = u8_to_dataview(tri[4][0].data), _last_offset = 0, _cell_storage: Uint8Array[] = [];
	var width = wide ? 4 : 1;
	for(var C = 0; C < data.length; ++C) {
		/* blank cell: mark both offset tables and move on */
		if(data[C] == null) { dv.setUint16(C*2, 0xFFFF, true); _dv.setUint16(C*2, 0xFFFF, true); continue; }
		dv.setUint16(C*2, last_offset / width, true);
		/*if(!wide)*/ _dv.setUint16(C*2, _last_offset / width, true);
		/* map the JS type to the cell type character */
		var t: "s" | "n" | "b";
		switch(typeof data[C]) {
			case "string": t = "s"; break;
			case "number": t = "n"; break;
			case "boolean": t = "b"; break;
			default: throw new Error("Unsupported value " + data[C]);
		}
		var celload: Uint8Array = write_new_storage({t: t, v: data[C]}, SST);
		/*if(!wide)*/ var _celload: Uint8Array = write_old_storage({t: t, v: data[C]}, SST);
		cell_storage.push(celload); last_offset += celload.length;
		/*if(!wide)*/ { _cell_storage.push(_celload); _last_offset += _celload.length; }
		++cnt;
	}
	tri[2][0].data = write_varint49(cnt);
	tri[5][0].data = write_varint49(5);
	/* mark the remaining slots of the offset tables as blank */
	for(; C < tri[7][0].data.length/2; ++C) {
		dv.setUint16(C*2, 0xFFFF, true);
		/*if(!wide)*/ _dv.setUint16(C*2, 0xFFFF, true);
	}
	tri[6][0].data = u8concat(cell_storage);
	/*if(!wide)*/ tri[3][0].data = u8concat(_cell_storage);
	tri[8] = [{type: 0, data: write_varint49(wide ? 1 : 0)}];
	return cnt;
}
2022-04-11 04:11:47 +00:00
/**
 * Write IWA Message
 *
 * Wraps a payload in a message whose metadata carries only the message type
 * (field 1, written as a varint).
 *
 * @param type    numeric message type
 * @param payload message body
 * @returns the assembled message
 */
function write_iwam(type: number, payload: Uint8Array): IWAMessage {
	return {
		meta: [ [],
			[ { type: 0, data: write_varint49(type) } ],
			// [ { type: 2, data: new Uint8Array([1, 0, 5]) }]
		],
		data: payload
	};
}
/** Archive id -> bookkeeping record; `last` holds the id most recently handed out by get_unique_msgid */
type Dependents = {[x:number]: DependentInfo; last?: number;};
2022-04-11 04:11:47 +00:00
/**
 * Reserve an unused message id and register `dep` under it.
 *
 * The search starts at `dependents.last` (927262 when unset) and stops
 * before 2000000. The chosen id is remembered in `dependents.last`.
 *
 * @param dep        record to store under the new id
 * @param dependents id table; mutated in place
 * @returns the newly reserved id
 * @throws Error when no free id remains below 2000000
 */
function get_unique_msgid(dep: DependentInfo, dependents: Dependents) {
	var candidate = dependents.last || 927262;
	dependents.last = candidate;
	while(candidate < 2000000) {
		if(!dependents[candidate]) {
			dependents.last = candidate;
			dependents[candidate] = dep;
			return candidate;
		}
		++candidate;
	}
	throw new Error("Too many messages");
}
/**
 * Build an approximate dependency tree
 *
 * First pass: record, for every archive in every `.iwa` file (except
 * OperationStorage), its container path and the type of its first message.
 * Second pass: for every archive id greater than 1, find the archives that
 * contain the id's varint encoding anywhere in a message body and record
 * them as dependents. This is a byte search, not a real reference walk,
 * hence "approximate".
 *
 * @param cfb container holding the NUMBERS template
 * @returns table keyed by archive id
 */
function build_numbers_deps(cfb: CFB$Container): Dependents {
	var dependents: Dependents = {};
	var indices: number[] = [];
	cfb.FileIndex.map((fi, idx): [CFB$Entry, string] => ([fi, cfb.FullPaths[idx]])).forEach(row => {
		var fi = row[0], fp = row[1];
		if(fi.type != 2) return;
		if(!fi.name.match(/\.iwa/)) return;
		if(fi.name.match(/OperationStorage/)) return;
		parse_iwa_file(decompress_iwa_file(fi.content as Uint8Array)).forEach(packet => {
			indices.push(packet.id);
			dependents[packet.id] = { deps: [], location: fp, type: varint_to_i32(packet.messages[0].meta[1][0].data) };
		});
	});

	/* precompute a varint for each id */
	indices.sort((x,y) => x-y);
	var indices_varint: Array<[number, Uint8Array]> = indices.filter(x => x > 1).map(x => [x, write_varint49(x)] );

	/* build dependent tree */
	cfb.FileIndex.forEach(fi => {
		if(!fi.name.match(/\.iwa/)) return;
		if(fi.name.match(/OperationStorage/)) return;
		parse_iwa_file(decompress_iwa_file(fi.content as Uint8Array)).forEach(ia => {
			// this is a huge hack based on the observation that most messages of interest have id > 900000
			// TODO: use the actual references
			indices_varint.forEach(ivi => {
				/* messages of type 11006 are excluded from the byte search */
				if(ia.messages.some(mess => varint_to_i32(mess.meta[1][0].data) != 11006 && u8contains(mess.data, ivi[1]))) {
					dependents[ivi[0]].deps.push(ia.id);
				}
			});
		});
	});
	return dependents;
}
/**
 * Write NUMBERS workbook
 *
 * Loads the base64 template passed in `opts.numbers`, locates the document
 * root (archive 1) and rewrites the template in place with the workbook data.
 *
 * @param wb   workbook to write
 * @param opts writing options; `numbers` must hold the base64 template
 * @returns the mutated template container
 * @throws Error when `opts.numbers` is missing or the template has no archive 1;
 *         a string when the document file or root packet cannot be found
 */
function write_numbers_iwa(wb: WorkBook, opts?: WritingOptions): CFB$Container {
	if(!opts || !opts.numbers) throw new Error("Must pass a `numbers` option -- check the README");
	/* read template and build packet metadata */
	var cfb: CFB$Container = CFB.read(opts.numbers, { type: "base64" });
	var dependents: Dependents = build_numbers_deps(cfb);
	/* .TN.DocumentArchive */
	/* fail with a readable message instead of a TypeError when archive 1 is absent */
	if(!dependents[1]) throw new Error(`Could not find message ${1} in Numbers template`);
	var cfb_DA = CFB.find(cfb, dependents[1].location);
	if(!cfb_DA) throw `Could not find ${dependents[1].location} in Numbers template`;
	var iwa_DA = parse_iwa_file(decompress_iwa_file(cfb_DA.content as Uint8Array));
	var docroot: IWAArchiveInfo = iwa_DA.find(packet => packet.id == 1) as IWAArchiveInfo;
	if(docroot == null) throw `Could not find message ${1} in Numbers template`;
	var sheetrefs = mappa(parse_shallow(docroot.messages[0].data)[1], parse_TSP_Reference);
	wb.SheetNames.forEach((name, idx) => write_numbers_ws(cfb, dependents, wb.Sheets[name], name, idx, sheetrefs[idx]));
	return cfb;
}
/**
 * Find a particular message by ID, perform actions and commit
 *
 * The file holding the archive is decompressed and parsed, `cb` is invoked
 * with the matching archive and the full archive list, and afterwards the
 * whole list is serialized back into the container entry.
 *
 * @param cfb  container to read from and write to
 * @param deps id table used to locate the file that holds `id`
 * @param id   archive id to look up
 * @param cb   mutator; receives the archive and every archive of the same file
 * @throws Error when `id` is unknown or not present in its file;
 *         a string when the file is missing from the container
 */
function numbers_iwa_doit(cfb: CFB$Container, deps: Dependents, id: number, cb:(ai:IWAArchiveInfo, x:IWAArchiveInfo[])=>void) {
	var dep = deps[id];
	if(!dep) throw new Error(`Could not find message ${id} in Numbers template`);
	var entry = CFB.find(cfb, dep.location);
	if(!entry) throw `Could not find ${dep.location} in Numbers template`;
	var x = parse_iwa_file(decompress_iwa_file(entry.content as Uint8Array));
	var ainfo: IWAArchiveInfo | undefined = x.find(packet => packet.id == id);
	/* previously assumed to exist; the callback would fail on `undefined` */
	if(!ainfo) throw new Error(`Could not find message ${id} in Numbers template`);
	cb(ainfo, x);
	entry.content = compress_iwa_file(write_iwa_file(x)); entry.size = entry.content.length;
}
/**
 * Find a particular message by ID
 *
 * Read-only lookup: the file holding the archive is decompressed and parsed,
 * and the matching archive is returned. Nothing is written back.
 *
 * @param cfb  container to read from
 * @param deps id table used to locate the file that holds `id`
 * @param id   archive id to look up
 * @returns the matching archive
 * @throws Error when `id` is unknown or not present in its file;
 *         a string when the file is missing from the container
 */
function numbers_iwa_find(cfb: CFB$Container, deps: Dependents, id: number) {
	var dep = deps[id];
	if(!dep) throw new Error(`Could not find message ${id} in Numbers template`);
	var entry = CFB.find(cfb, dep.location);
	if(!entry) throw `Could not find ${dep.location} in Numbers template`;
	var x = parse_iwa_file(decompress_iwa_file(entry.content as Uint8Array));
	var ainfo: IWAArchiveInfo | undefined = x.find(packet => packet.id == id);
	/* previously assumed to exist; callers dereference the result immediately */
	if(!ainfo) throw new Error(`Could not find message ${id} in Numbers template`);
	return ainfo as IWAArchiveInfo;
}
/**
 * Write NUMBERS worksheet
 *
 * Renames the template sheet, then rewrites the table model of the first
 * drawable on that sheet with the worksheet data. Only the first worksheet
 * is written; later ones are reported via `console.error` and skipped.
 *
 * @param cfb      template container; mutated in place
 * @param deps     id table for the template
 * @param ws       worksheet to write
 * @param wsname   name to give the sheet
 * @param sheetidx index of the worksheet within the workbook
 * @param rootref  archive id of the template's SheetArchive
 */
function write_numbers_ws(cfb: CFB$Container, deps: Dependents, ws: WorkSheet, wsname: string, sheetidx: number, rootref: number): void {
	/* TODO: support multiple worksheets, larger ranges, more data types, etc */
	if(sheetidx >= 1) return console.error("The Numbers writer currently writes only the first table");

	/* .TN.SheetArchive */
	var drawables: number[] = [];
	numbers_iwa_doit(cfb, deps, rootref, (docroot) => {
		var sheetref = parse_shallow(docroot.messages[0].data);
		{
			/* write worksheet name */
			sheetref[1] = [ { type: 2, data: stru8(wsname) }];
			drawables = mappa(sheetref[2], parse_TSP_Reference);
		}
		docroot.messages[0].data = write_shallow(sheetref);
	});

	/* .TST.TableInfoArchive */
	// TODO: verify that the first entry is actually a table
	// TODO: eventually support multiple tables (and replicate in QPW)
	var tia: IWAArchiveInfo = numbers_iwa_find(cfb, deps, drawables[0]);

	/* .TST.TableModelArchive */
	var tmaref = parse_TSP_Reference(parse_shallow(tia.messages[0].data)[2][0].data);
	numbers_iwa_doit(cfb, deps, tmaref, (docroot, x) => write_numbers_tma(cfb, deps, ws, docroot, x, tmaref));
}
2022-03-25 00:12:55 +00:00
/** Passed as the `wide` flag to write_tile_row and written into field 8 of newly created tiles */
var USE_WIDE_ROWS = true;
/**
 * Write .TST.TableModelArchive
 *
 * Rewrites the table model of the template with the worksheet contents:
 * row / column headers, shared string table, tile storage (existing tile is
 * dropped and new tiles of 256 rows are created), the row rbtree and the
 * merge list. The package metadata (archive 2) is updated for every archive
 * that is added or removed.
 *
 * Intended to run inside a `numbers_iwa_doit` callback for `tmaref`, which
 * commits `tmafile` after this function returns.
 *
 * NOTE(review): the nested `numbers_iwa_doit` calls below re-read and commit
 * their own container entries. If any of the referenced archives lived in the
 * same `.iwa` file as the TableModelArchive, the outer commit would overwrite
 * those changes -- confirm the template keeps them in separate files.
 *
 * @param cfb     template container; mutated in place
 * @param deps    id table for the template; new tile / merge ids are added
 * @param ws      worksheet to write
 * @param tmaroot archive holding the TableModelArchive message; rewritten in place
 * @param tmafile every archive of the file that holds `tmaroot`; the merge archive is appended
 * @param tmaref  archive id of the TableModelArchive
 */
function write_numbers_tma(cfb: CFB$Container, deps: Dependents, ws, tmaroot: IWAArchiveInfo, tmafile: IWAArchiveInfo[], tmaref: number) {
	var range = decode_range(ws["!ref"] as string);
	/* the table always starts at A1 */
	range.s.r = range.s.c = 0;

	var trunc = false;
	/* Actual NUMBERS 12.1 range limit ALL1000000 */
	if(range.e.c > 999) { trunc = true; range.e.c = 999; }
	if(range.e.r > 999999) { trunc = true; range.e.r = 999999; }
	if(trunc) console.error(`Truncating to ${encode_range(range)}`);

	/* preprocess data and build up shared string table */
	var data = sheet_to_json<any>(ws, { range, header: 1 });
	var SST = ["~Sh33tJ5~"], SST_set = new Set(SST);
	data.forEach(row => row.forEach(cell => { if(typeof cell == "string" && !SST_set.has(cell)) { SST.push(cell); SST_set.add(cell); } }));

	/* identifier for finding the TableModelArchive in the archive */
	var loc = deps[tmaref].location;
	loc = loc.replace(/^Root Entry\//,""); // NOTE: the Root Entry prefix is an artifact of the CFB container library
	loc = loc.replace(/^Index\//, "").replace(/\.iwa$/,"");

	var pb = parse_shallow(tmaroot.messages[0].data);
	{
		pb[6][0].data = write_varint49(range.e.r + 1); // number_of_rows
		pb[7][0].data = write_varint49(range.e.c + 1); // number_of_columns
		// pb[22] = [ { type: 0, data: write_varint49(1) } ]; // displays table name in sheet
		delete pb[46]; // base_column_row_uids -- deleting forces Numbers to refresh cell table

		/* .TST.DataStore */
		var store = parse_shallow(pb[4][0].data);
		{
			/* rewrite row headers */
			var row_header_ref = parse_TSP_Reference(parse_shallow(store[1][0].data)[2][0].data);
			numbers_iwa_doit(cfb, deps, row_header_ref, (rowhead, _x) => {
				var base_bucket = parse_shallow(rowhead.messages[0].data);
				/* the first bucket serves as the template for every row */
				if(base_bucket?.[2]?.[0]) for(var R = 0; R < data.length; ++R) {
					var _bucket = parse_shallow(base_bucket[2][0].data);
					_bucket[1][0].data = write_varint49(R);
					_bucket[4][0].data = write_varint49(data[R].length);
					base_bucket[2][R] = { type: base_bucket[2][0].type, data: write_shallow(_bucket) };
				}
				rowhead.messages[0].data = write_shallow(base_bucket);
			});

			/* rewrite col headers */
			var col_header_ref = parse_TSP_Reference(store[2][0].data);
			numbers_iwa_doit(cfb, deps, col_header_ref, (colhead, _x) => {
				var base_bucket = parse_shallow(colhead.messages[0].data);
				/* the first bucket serves as the template for every column */
				for(var C = 0; C <= range.e.c; ++C) {
					var _bucket = parse_shallow(base_bucket[2][0].data);
					_bucket[1][0].data = write_varint49(C);
					_bucket[4][0].data = write_varint49(range.e.r + 1);
					base_bucket[2][C] = { type: base_bucket[2][0].type, data: write_shallow(_bucket) };
				}
				colhead.messages[0].data = write_shallow(base_bucket);
			});

			/* rebuild shared string table */
			var sstref = parse_TSP_Reference(store[4][0].data);
			numbers_iwa_doit(cfb, deps, sstref, (sstroot) => {
				var sstdata = parse_shallow(sstroot.messages[0].data);
				{
					sstdata[3] = [];
					/* one entry per string: field 1 = index, field 2 = 1, field 3 = text */
					SST.forEach((str, i) => {
						sstdata[3].push({type: 2, data: write_shallow([ [],
							[ { type: 0, data: write_varint49(i) } ],
							[ { type: 0, data: write_varint49(1) } ],
							[ { type: 2, data: stru8(str) } ]
						])});
					});
				}
				sstroot.messages[0].data = write_shallow(sstdata);
			});

			/* the row rbtree is rebuilt from scratch, one entry per tile */
			var rbtree = parse_shallow(store[9][0].data);
			rbtree[1] = [];

			/* .TST.TileStorage */
			var tilestore = parse_shallow(store[3][0].data);
			{
				/* number of rows per tile */
				var tstride = 256; // NOTE: if this is not 256, Numbers will recalculate
				tilestore[2] = [{type: 0, data: write_varint49(tstride)}];
				//tilestore[3] = [{type: 0, data: write_varint49(USE_WIDE_ROWS ? 1 : 0)}]; // elicits a modification message

				var tileref = parse_TSP_Reference(parse_shallow(tilestore[1][0].data)[2][0].data);

				/* field 12 of the removed tile's metadata entry, reused for the new tiles */
				var save_token = 0;

				/* remove existing tile */
				{
					CFB.utils.cfb_del(cfb, deps[tileref].location);

					/* remove existing tile from reference -- TODO: can this have an id other than 2? */
					numbers_iwa_doit(cfb, deps, 2, (ai => {
						var mlist = parse_shallow(ai.messages[0].data);

						var lst = mlist[3].filter(m => parse_varint49(parse_shallow(m.data)[1][0].data) == tileref);
						if(lst && lst.length > 0) save_token = parse_varint49(parse_shallow(lst[0].data)[12][0].data);

						mlist[3] = mlist[3].filter(m => parse_varint49(parse_shallow(m.data)[1][0].data) != tileref);

						/* remove reference from TableModelArchive file to Tile */
						var parentidx = mlist[3].findIndex(m => {
							var mm = parse_shallow(m.data);
							if(mm[3]?.[0]) return u8str(mm[3][0].data) == loc;
							if(mm[2]?.[0] && u8str(mm[2][0].data) == loc) return true;
							return false;
						});
						var parent = parse_shallow(mlist[3][parentidx].data);
						if(!parent[6]) parent[6] = [];
						parent[6] = parent[6].filter(m => parse_varint49(parse_shallow(m.data)[1][0].data) != tileref);
						mlist[3][parentidx].data = write_shallow(parent);

						ai.messages[0].data = write_shallow(mlist);
					}));
				}

				/* rewrite entire tile storage */
				tilestore[1] = [] as ProtoField;
				var ntiles = Math.ceil((range.e.r + 1)/tstride);

				for(var tidx = 0; tidx < ntiles; ++tidx) {
					var newtileid = get_unique_msgid({
						deps: [], // TODO: probably should update this
						location: "",
						type: 6002
					}, deps);
					deps[newtileid].location = `Root Entry/Index/Tables/Tile-${newtileid}.iwa`;

					/* create new tile */
					var tiledata: ProtoMessage = [
						[],
						[{type: 0, data: write_varint49(0 /*range.e.c + 1*/)}],
						[{type: 0, data: write_varint49(Math.min(range.e.r + 1, (tidx + 1) * tstride))}],
						[{type: 0, data: write_varint49(0/*cnt*/)}],
						[{type: 0, data: write_varint49(Math.min((tidx+1)*tstride,range.e.r+1) - tidx * tstride)}],
						[],
						[{type: 0, data: write_varint49(5)}],
						[{type: 0, data: write_varint49(1)}],
						[{type: 0, data: write_varint49(USE_WIDE_ROWS ? 1 : 0)}]
					];
					for(var R = tidx * tstride; R <= Math.min(range.e.r, (tidx + 1) * tstride - 1); ++R) {
						/* blank row skeleton; write_tile_row fills in the cells */
						var tilerow: ProtoMessage = [
							[],
							[ { type: 0, data: write_varint49(0) }],
							[ { type: 0, data: write_varint49(0) }],
							[ { type: 2, data: new Uint8Array([]) }],
							[ { type: 2, data: new Uint8Array(Array.from({length:510}, () => 255)) }],
							[ { type: 0, data: write_varint49(5) }],
							[ { type: 2, data: new Uint8Array([]) }],
							[ { type: 2, data: new Uint8Array(Array.from({length:510}, () => 255)) }],
							[ { type: 0, data: write_varint49(1) }],
						] as ProtoMessage;
						write_tile_row(tilerow, data[R], SST, USE_WIDE_ROWS);
						/* row index is relative to the start of the tile */
						tilerow[1][0].data = write_varint49(R - tidx * tstride);
						tiledata[5].push({data: write_shallow(tilerow), type: 2});
					}

					/* add to tiles */
					tilestore[1].push({type: 2, data: write_shallow([
						[],
						[{type: 0, data: write_varint49(tidx)}],
						[{type: 2, data: write_TSP_Reference(newtileid)}]
					])});

					/* add to file */
					var newtile: IWAArchiveInfo = {
						id: newtileid,
						messages: [ write_iwam(6002, write_shallow(tiledata))]
					};
					var tilecontent = compress_iwa_file(write_iwa_file([newtile]));
					CFB.utils.cfb_add(cfb, `/Index/Tables/Tile-${newtileid}.iwa`, tilecontent);

					/* update metadata -- TODO: can this have an id other than 2? */
					numbers_iwa_doit(cfb, deps, 2, (ai => {
						var mlist = parse_shallow(ai.messages[0].data);
						mlist[3].push({type: 2, data: write_shallow([
							[],
							[{type: 0, data: write_varint49(newtileid)}],
							[{type: 2, data: stru8("Tables/Tile") }],
							[{type: 2, data: stru8(`Tables/Tile-${newtileid}`)}],
							[{type: 2, data: new Uint8Array([2, 0, 0])}],
							[{type: 2, data: new Uint8Array([2, 0, 0])}],
							[],
							[],
							[],
							[],
							[{type: 0, data: write_varint49(0)}],
							[],
							[{type: 0, data: write_varint49(save_token)}],
						])});
						/* keep field 1 above the largest id in use */
						mlist[1] = [{type: 0, data: write_varint49(Math.max(newtileid + 1, parse_varint49(mlist[1][0].data) ))}];

						/* add reference from TableModelArchive file to Tile */
						var parentidx = mlist[3].findIndex(m => {
							var mm = parse_shallow(m.data);
							if(mm[3]?.[0]) return u8str(mm[3][0].data) == loc;
							if(mm[2]?.[0] && u8str(mm[2][0].data) == loc) return true;
							return false;
						});
						var parent = parse_shallow(mlist[3][parentidx].data);
						if(!parent[6]) parent[6] = [];
						parent[6].push({
							type: 2,
							data: write_shallow([
								[],
								[{type: 0, data: write_varint49(newtileid) }]
							])
						});
						mlist[3][parentidx].data = write_shallow(parent);

						ai.messages[0].data = write_shallow(mlist);
					}));

					/* add to TableModelArchive object references */
					var orefs: number[] = tmaroot.messages[0].meta[5]?.[0] ? parse_packed_varints(tmaroot.messages[0].meta[5][0].data) : [];
					var orefidx = orefs.indexOf(newtileid);
					if(orefidx == -1) {
						orefs[orefidx = orefs.length] = newtileid;
						tmaroot.messages[0].meta[5] =[ {type: 2, data: write_packed_varints(orefs) }];
					}

					/* add to row rbtree */
					rbtree[1].push({type: 2, data: write_shallow([
						[],
						[{ type: 0, data: write_varint49(tidx*tstride) }],
						[{ type: 0, data: write_varint49(tidx) }]
					])});
				}
			}
			store[3][0].data = write_shallow(tilestore);
			store[9][0].data = write_shallow(rbtree);
			store[10] = [ { type: 2, data: new Uint8Array([]) }];

			/* write merge list */
			if(ws["!merges"]) {
				var mergeid = get_unique_msgid({
					type: 6144,
					deps: [tmaref],
					location: deps[tmaref].location
				}, deps);

				/* the merge archive lives in the same file as the TableModelArchive */
				tmafile.push({
					id: mergeid,
					messages: [ write_iwam(6144, write_shallow([ [],
						ws["!merges"].map((m: Range) => ({type: 2, data: write_shallow([ [],
							/* origin: row and column as two 16-bit values */
							[{ type: 2, data: write_shallow([ [],
								[{ type: 5, data: new Uint8Array(new Uint16Array([m.s.r, m.s.c]).buffer) }],
							])}],
							/* size: row count and column count as two 16-bit values */
							[{ type: 2, data: write_shallow([ [],
								[{ type: 5, data: new Uint8Array(new Uint16Array([m.e.r - m.s.r + 1, m.e.c - m.s.c + 1]).buffer) }],
							]) }]
						])} as ProtoItem))
					])) ]
				} as IWAArchiveInfo);
				store[13] = [ { type: 2, data: write_TSP_Reference(mergeid) } ];

				numbers_iwa_doit(cfb, deps, 2, (ai => {
					var mlist = parse_shallow(ai.messages[0].data);

					/* add reference from TableModelArchive file to merge */
					var parentidx = mlist[3].findIndex(m => {
						var mm = parse_shallow(m.data);
						if(mm[3]?.[0]) return u8str(mm[3][0].data) == loc;
						if(mm[2]?.[0] && u8str(mm[2][0].data) == loc) return true;
						return false;
					});
					var parent = parse_shallow(mlist[3][parentidx].data);
					if(!parent[6]) parent[6] = [];
					parent[6].push({
						type: 2,
						data: write_shallow([
							[],
							[{type: 0, data: write_varint49(mergeid) }]
						])
					});
					mlist[3][parentidx].data = write_shallow(parent);

					ai.messages[0].data = write_shallow(mlist);
				}));

				/* add object reference from TableModelArchive */
				/* var*/ orefs /*: number[]*/ = tmaroot.messages[0].meta[5]?.[0] ? parse_packed_varints(tmaroot.messages[0].meta[5][0].data) : [];
				/* var*/ orefidx = orefs.indexOf(mergeid);
				if(orefidx == -1) {
					orefs[orefidx = orefs.length] = mergeid;
					tmaroot.messages[0].meta[5] =[ {type: 2, data: write_packed_varints(orefs) }];
				}
			} else delete store[13]; // TODO: delete references to merge if not needed
		}
		pb[4][0].data = write_shallow(store);
	}
	tmaroot.messages[0].data = write_shallow(pb);
}