forked from sheetjs/sheetjs
SheetJS
e59de73f99
- XLS normalize URLs and use moniker (fixes #2385) - ODS row heights and column widths (fixes #2378) - DSV parse of files with leading <, deviating from Excel (fixes #1238) - read `ArrayBuffer` with no type (fixes #2316) - removed invalid test files that throw errors due to string length - AOA/JSON null optional map to #NULL! (fixes #1196)
632 lines
23 KiB
JavaScript
632 lines
23 KiB
JavaScript
/* [MS-DTYP] 2.3.3 FILETIME */
|
|
/* [MS-OLEDS] 2.1.3 FILETIME (Packet Version) */
|
|
/* [MS-OLEPS] 2.8 FILETIME (Packet Version) */
|
|
function parse_FILETIME(blob) {
|
|
var dwLowDateTime = blob.read_shift(4), dwHighDateTime = blob.read_shift(4);
|
|
return new Date(((dwHighDateTime/1e7*Math.pow(2,32) + dwLowDateTime/1e7) - 11644473600)*1000).toISOString().replace(/\.000/,"");
|
|
}
|
|
function write_FILETIME(time/*:string|Date*/) {
|
|
var date = (typeof time == "string") ? new Date(Date.parse(time)) : time;
|
|
var t = date.getTime() / 1000 + 11644473600;
|
|
var l = t % Math.pow(2,32), h = (t - l) / Math.pow(2,32);
|
|
l *= 1e7; h *= 1e7;
|
|
var w = (l / Math.pow(2,32)) | 0;
|
|
if(w > 0) { l = l % Math.pow(2,32); h += w; }
|
|
var o = new_buf(8); o.write_shift(4, l); o.write_shift(4, h); return o;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.4 Lpstr */
|
|
function parse_lpstr(blob, type, pad/*:?number*/) {
|
|
var start = blob.l;
|
|
var str = blob.read_shift(0, 'lpstr-cp');
|
|
if(pad) while((blob.l - start) & 3) ++blob.l;
|
|
return str;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.6 Lpwstr */
|
|
function parse_lpwstr(blob, type, pad) {
|
|
var str = blob.read_shift(0, 'lpwstr');
|
|
if(pad) blob.l += (4 - ((str.length+1) & 3)) & 3;
|
|
return str;
|
|
}
|
|
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.11 VtString */
|
|
/* [MS-OSHARED] 2.3.3.1.12 VtUnalignedString */
|
|
function parse_VtStringBase(blob, stringType, pad) {
|
|
if(stringType === 0x1F /*VT_LPWSTR*/) return parse_lpwstr(blob);
|
|
return parse_lpstr(blob, stringType, pad);
|
|
}
|
|
|
|
function parse_VtString(blob, t/*:number*/, pad/*:?boolean*/) { return parse_VtStringBase(blob, t, pad === false ? 0: 4); }
|
|
function parse_VtUnalignedString(blob, t/*:number*/) { if(!t) throw new Error("VtUnalignedString must have positive length"); return parse_VtStringBase(blob, t, 0); }
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.9 VtVecUnalignedLpstrValue */
|
|
function parse_VtVecUnalignedLpstrValue(blob)/*:Array<string>*/ {
|
|
var length = blob.read_shift(4);
|
|
var ret/*:Array<string>*/ = [];
|
|
for(var i = 0; i != length; ++i) ret[i] = blob.read_shift(0, 'lpstr-cp').replace(chr0,'');
|
|
return ret;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.10 VtVecUnalignedLpstr */
|
|
function parse_VtVecUnalignedLpstr(blob)/*:Array<string>*/ {
|
|
return parse_VtVecUnalignedLpstrValue(blob);
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.13 VtHeadingPair */
|
|
function parse_VtHeadingPair(blob) {
|
|
var headingString = parse_TypedPropertyValue(blob, VT_USTR);
|
|
var headerParts = parse_TypedPropertyValue(blob, VT_I4);
|
|
return [headingString, headerParts];
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.14 VtVecHeadingPairValue */
|
|
function parse_VtVecHeadingPairValue(blob) {
|
|
var cElements = blob.read_shift(4);
|
|
var out = [];
|
|
for(var i = 0; i != cElements / 2; ++i) out.push(parse_VtHeadingPair(blob));
|
|
return out;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.3.1.15 VtVecHeadingPair */
|
|
function parse_VtVecHeadingPair(blob) {
|
|
// NOTE: When invoked, wType & padding were already consumed
|
|
return parse_VtVecHeadingPairValue(blob);
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.18.1 Dictionary (uses 2.17, 2.16) */
|
|
function parse_dictionary(blob,CodePage) {
|
|
var cnt = blob.read_shift(4);
|
|
var dict/*:{[number]:string}*/ = ({}/*:any*/);
|
|
for(var j = 0; j != cnt; ++j) {
|
|
var pid = blob.read_shift(4);
|
|
var len = blob.read_shift(4);
|
|
dict[pid] = blob.read_shift(len, (CodePage === 0x4B0 ?'utf16le':'utf8')).replace(chr0,'').replace(chr1,'!');
|
|
if(CodePage === 0x4B0 && (len % 2)) blob.l += 2;
|
|
}
|
|
if(blob.l & 3) blob.l = (blob.l>>2+1)<<2;
|
|
return dict;
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.9 BLOB */
|
|
function parse_BLOB(blob) {
|
|
var size = blob.read_shift(4);
|
|
var bytes = blob.slice(blob.l,blob.l+size);
|
|
blob.l += size;
|
|
if((size & 3) > 0) blob.l += (4 - (size & 3)) & 3;
|
|
return bytes;
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.11 ClipboardData */
|
|
function parse_ClipboardData(blob) {
|
|
// TODO
|
|
var o = {};
|
|
o.Size = blob.read_shift(4);
|
|
//o.Format = blob.read_shift(4);
|
|
blob.l += o.Size + 3 - (o.Size - 1) % 4;
|
|
return o;
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.15 TypedPropertyValue */
|
|
function parse_TypedPropertyValue(blob, type/*:number*/, _opts)/*:any*/ {
|
|
var t = blob.read_shift(2), ret, opts = _opts||{};
|
|
blob.l += 2;
|
|
if(type !== VT_VARIANT)
|
|
if(t !== type && VT_CUSTOM.indexOf(type)===-1) throw new Error('Expected type ' + type + ' saw ' + t);
|
|
switch(type === VT_VARIANT ? t : type) {
|
|
case 0x02 /*VT_I2*/: ret = blob.read_shift(2, 'i'); if(!opts.raw) blob.l += 2; return ret;
|
|
case 0x03 /*VT_I4*/: ret = blob.read_shift(4, 'i'); return ret;
|
|
case 0x0B /*VT_BOOL*/: return blob.read_shift(4) !== 0x0;
|
|
case 0x13 /*VT_UI4*/: ret = blob.read_shift(4); return ret;
|
|
case 0x1E /*VT_LPSTR*/: return parse_lpstr(blob, t, 4).replace(chr0,'');
|
|
case 0x1F /*VT_LPWSTR*/: return parse_lpwstr(blob);
|
|
case 0x40 /*VT_FILETIME*/: return parse_FILETIME(blob);
|
|
case 0x41 /*VT_BLOB*/: return parse_BLOB(blob);
|
|
case 0x47 /*VT_CF*/: return parse_ClipboardData(blob);
|
|
case 0x50 /*VT_STRING*/: return parse_VtString(blob, t, !opts.raw).replace(chr0,'');
|
|
case 0x51 /*VT_USTR*/: return parse_VtUnalignedString(blob, t/*, 4*/).replace(chr0,'');
|
|
case 0x100C /*VT_VECTOR|VT_VARIANT*/: return parse_VtVecHeadingPair(blob);
|
|
case 0x101E /*VT_LPSTR*/: return parse_VtVecUnalignedLpstr(blob);
|
|
default: throw new Error("TypedPropertyValue unrecognized type " + type + " " + t);
|
|
}
|
|
}
|
|
function write_TypedPropertyValue(type/*:number*/, value) {
|
|
var o = new_buf(4), p = new_buf(4);
|
|
o.write_shift(4, type == 0x50 ? 0x1F : type);
|
|
switch(type) {
|
|
case 0x03 /*VT_I4*/: p.write_shift(-4, value); break;
|
|
case 0x05 /*VT_I4*/: p = new_buf(8); p.write_shift(8, value, 'f'); break;
|
|
case 0x0B /*VT_BOOL*/: p.write_shift(4, value ? 0x01 : 0x00); break;
|
|
case 0x40 /*VT_FILETIME*/: /*:: if(typeof value !== "string" && !(value instanceof Date)) throw "unreachable"; */ p = write_FILETIME(value); break;
|
|
case 0x1F /*VT_LPWSTR*/:
|
|
case 0x50 /*VT_STRING*/:
|
|
/*:: if(typeof value !== "string") throw "unreachable"; */
|
|
p = new_buf(4 + 2 * (value.length + 1) + (value.length % 2 ? 0 : 2));
|
|
p.write_shift(4, value.length + 1);
|
|
p.write_shift(0, value, "dbcs");
|
|
while(p.l != p.length) p.write_shift(1, 0);
|
|
break;
|
|
default: throw new Error("TypedPropertyValue unrecognized type " + type + " " + value);
|
|
}
|
|
return bconcat([o, p]);
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.20 PropertySet */
|
|
function parse_PropertySet(blob, PIDSI) {
|
|
var start_addr = blob.l;
|
|
var size = blob.read_shift(4);
|
|
var NumProps = blob.read_shift(4);
|
|
var Props = [], i = 0;
|
|
var CodePage = 0;
|
|
var Dictionary = -1, DictObj/*:{[number]:string}*/ = ({}/*:any*/);
|
|
for(i = 0; i != NumProps; ++i) {
|
|
var PropID = blob.read_shift(4);
|
|
var Offset = blob.read_shift(4);
|
|
Props[i] = [PropID, Offset + start_addr];
|
|
}
|
|
Props.sort(function(x,y) { return x[1] - y[1]; });
|
|
var PropH = {};
|
|
for(i = 0; i != NumProps; ++i) {
|
|
if(blob.l !== Props[i][1]) {
|
|
var fail = true;
|
|
if(i>0 && PIDSI) switch(PIDSI[Props[i-1][0]].t) {
|
|
case 0x02 /*VT_I2*/: if(blob.l+2 === Props[i][1]) { blob.l+=2; fail = false; } break;
|
|
case 0x50 /*VT_STRING*/: if(blob.l <= Props[i][1]) { blob.l=Props[i][1]; fail = false; } break;
|
|
case 0x100C /*VT_VECTOR|VT_VARIANT*/: if(blob.l <= Props[i][1]) { blob.l=Props[i][1]; fail = false; } break;
|
|
}
|
|
if((!PIDSI||i==0) && blob.l <= Props[i][1]) { fail=false; blob.l = Props[i][1]; }
|
|
if(fail) throw new Error("Read Error: Expected address " + Props[i][1] + ' at ' + blob.l + ' :' + i);
|
|
}
|
|
if(PIDSI) {
|
|
var piddsi = PIDSI[Props[i][0]];
|
|
PropH[piddsi.n] = parse_TypedPropertyValue(blob, piddsi.t, {raw:true});
|
|
if(piddsi.p === 'version') PropH[piddsi.n] = String(PropH[piddsi.n] >> 16) + "." + ("0000" + String(PropH[piddsi.n] & 0xFFFF)).slice(-4);
|
|
if(piddsi.n == "CodePage") switch(PropH[piddsi.n]) {
|
|
case 0: PropH[piddsi.n] = 1252;
|
|
/* falls through */
|
|
case 874:
|
|
case 932:
|
|
case 936:
|
|
case 949:
|
|
case 950:
|
|
case 1250:
|
|
case 1251:
|
|
case 1253:
|
|
case 1254:
|
|
case 1255:
|
|
case 1256:
|
|
case 1257:
|
|
case 1258:
|
|
case 10000:
|
|
case 1200:
|
|
case 1201:
|
|
case 1252:
|
|
case 65000: case -536:
|
|
case 65001: case -535:
|
|
set_cp(CodePage = (PropH[piddsi.n]>>>0) & 0xFFFF); break;
|
|
default: throw new Error("Unsupported CodePage: " + PropH[piddsi.n]);
|
|
}
|
|
} else {
|
|
if(Props[i][0] === 0x1) {
|
|
CodePage = PropH.CodePage = (parse_TypedPropertyValue(blob, VT_I2)/*:number*/);
|
|
set_cp(CodePage);
|
|
if(Dictionary !== -1) {
|
|
var oldpos = blob.l;
|
|
blob.l = Props[Dictionary][1];
|
|
DictObj = parse_dictionary(blob,CodePage);
|
|
blob.l = oldpos;
|
|
}
|
|
} else if(Props[i][0] === 0) {
|
|
if(CodePage === 0) { Dictionary = i; blob.l = Props[i+1][1]; continue; }
|
|
DictObj = parse_dictionary(blob,CodePage);
|
|
} else {
|
|
var name = DictObj[Props[i][0]];
|
|
var val;
|
|
/* [MS-OSHARED] 2.3.3.2.3.1.2 + PROPVARIANT */
|
|
switch(blob[blob.l]) {
|
|
case 0x41 /*VT_BLOB*/: blob.l += 4; val = parse_BLOB(blob); break;
|
|
case 0x1E /*VT_LPSTR*/: blob.l += 4; val = parse_VtString(blob, blob[blob.l-4]).replace(/\u0000+$/,""); break;
|
|
case 0x1F /*VT_LPWSTR*/: blob.l += 4; val = parse_VtString(blob, blob[blob.l-4]).replace(/\u0000+$/,""); break;
|
|
case 0x03 /*VT_I4*/: blob.l += 4; val = blob.read_shift(4, 'i'); break;
|
|
case 0x13 /*VT_UI4*/: blob.l += 4; val = blob.read_shift(4); break;
|
|
case 0x05 /*VT_R8*/: blob.l += 4; val = blob.read_shift(8, 'f'); break;
|
|
case 0x0B /*VT_BOOL*/: blob.l += 4; val = parsebool(blob, 4); break;
|
|
case 0x40 /*VT_FILETIME*/: blob.l += 4; val = parseDate(parse_FILETIME(blob)); break;
|
|
default: throw new Error("unparsed value: " + blob[blob.l]);
|
|
}
|
|
PropH[name] = val;
|
|
}
|
|
}
|
|
}
|
|
blob.l = start_addr + size; /* step ahead to skip padding */
|
|
return PropH;
|
|
}
|
|
var XLSPSSkip = [ "CodePage", "Thumbnail", "_PID_LINKBASE", "_PID_HLINKS", "SystemIdentifier", "FMTID" ].concat(PseudoPropsPairs);
|
|
function guess_property_type(val/*:any*/)/*:number*/ {
|
|
switch(typeof val) {
|
|
case "boolean": return 0x0B;
|
|
case "number": return ((val|0)==val) ? 0x03 : 0x05;
|
|
case "string": return 0x1F;
|
|
case "object": if(val instanceof Date) return 0x40; break;
|
|
}
|
|
return -1;
|
|
}
|
|
function write_PropertySet(entries, RE, PIDSI) {
|
|
var hdr = new_buf(8), piao = [], prop = [];
|
|
var sz = 8, i = 0;
|
|
|
|
var pr = new_buf(8), pio = new_buf(8);
|
|
pr.write_shift(4, 0x0002);
|
|
pr.write_shift(4, 0x04B0);
|
|
pio.write_shift(4, 0x0001);
|
|
prop.push(pr); piao.push(pio);
|
|
sz += 8 + pr.length;
|
|
|
|
if(!RE) {
|
|
pio = new_buf(8);
|
|
pio.write_shift(4, 0);
|
|
piao.unshift(pio);
|
|
|
|
var bufs = [new_buf(4)];
|
|
bufs[0].write_shift(4, entries.length);
|
|
for(i = 0; i < entries.length; ++i) {
|
|
var value = entries[i][0];
|
|
pr = new_buf(4 + 4 + 2 * (value.length + 1) + (value.length % 2 ? 0 : 2));
|
|
pr.write_shift(4, i+2);
|
|
pr.write_shift(4, value.length + 1);
|
|
pr.write_shift(0, value, "dbcs");
|
|
while(pr.l != pr.length) pr.write_shift(1, 0);
|
|
bufs.push(pr);
|
|
}
|
|
pr = bconcat(bufs);
|
|
prop.unshift(pr);
|
|
sz += 8 + pr.length;
|
|
}
|
|
|
|
for(i = 0; i < entries.length; ++i) {
|
|
if(RE && !RE[entries[i][0]]) continue;
|
|
if(XLSPSSkip.indexOf(entries[i][0]) > -1) continue;
|
|
if(entries[i][1] == null) continue;
|
|
|
|
var val = entries[i][1], idx = 0;
|
|
if(RE) {
|
|
idx = +RE[entries[i][0]];
|
|
var pinfo = (PIDSI/*:: || {}*/)[idx]/*:: || {} */;
|
|
if(pinfo.p == "version" && typeof val == "string") {
|
|
/*:: if(typeof val !== "string") throw "unreachable"; */
|
|
var arr = val.split(".");
|
|
val = ((+arr[0])<<16) + ((+arr[1])||0);
|
|
}
|
|
pr = write_TypedPropertyValue(pinfo.t, val);
|
|
} else {
|
|
var T = guess_property_type(val);
|
|
if(T == -1) { T = 0x1F; val = String(val); }
|
|
pr = write_TypedPropertyValue(T, val);
|
|
}
|
|
prop.push(pr);
|
|
|
|
pio = new_buf(8);
|
|
pio.write_shift(4, !RE ? 2+i : idx);
|
|
piao.push(pio);
|
|
|
|
sz += 8 + pr.length;
|
|
}
|
|
|
|
var w = 8 * (prop.length + 1);
|
|
for(i = 0; i < prop.length; ++i) { piao[i].write_shift(4, w); w += prop[i].length; }
|
|
hdr.write_shift(4, sz);
|
|
hdr.write_shift(4, prop.length);
|
|
return bconcat([hdr].concat(piao).concat(prop));
|
|
}
|
|
|
|
/* [MS-OLEPS] 2.21 PropertySetStream */
|
|
function parse_PropertySetStream(file, PIDSI, clsid) {
|
|
var blob = file.content;
|
|
if(!blob) return ({}/*:any*/);
|
|
prep_blob(blob, 0);
|
|
|
|
var NumSets, FMTID0, FMTID1, Offset0, Offset1 = 0;
|
|
blob.chk('feff', 'Byte Order: ');
|
|
|
|
/*var vers = */blob.read_shift(2); // TODO: check version
|
|
var SystemIdentifier = blob.read_shift(4);
|
|
var CLSID = blob.read_shift(16);
|
|
if(CLSID !== CFB.utils.consts.HEADER_CLSID && CLSID !== clsid) throw new Error("Bad PropertySet CLSID " + CLSID);
|
|
NumSets = blob.read_shift(4);
|
|
if(NumSets !== 1 && NumSets !== 2) throw new Error("Unrecognized #Sets: " + NumSets);
|
|
FMTID0 = blob.read_shift(16); Offset0 = blob.read_shift(4);
|
|
|
|
if(NumSets === 1 && Offset0 !== blob.l) throw new Error("Length mismatch: " + Offset0 + " !== " + blob.l);
|
|
else if(NumSets === 2) { FMTID1 = blob.read_shift(16); Offset1 = blob.read_shift(4); }
|
|
var PSet0 = parse_PropertySet(blob, PIDSI);
|
|
|
|
var rval = ({ SystemIdentifier: SystemIdentifier }/*:any*/);
|
|
for(var y in PSet0) rval[y] = PSet0[y];
|
|
//rval.blob = blob;
|
|
rval.FMTID = FMTID0;
|
|
//rval.PSet0 = PSet0;
|
|
if(NumSets === 1) return rval;
|
|
if(Offset1 - blob.l == 2) blob.l += 2;
|
|
if(blob.l !== Offset1) throw new Error("Length mismatch 2: " + blob.l + " !== " + Offset1);
|
|
var PSet1;
|
|
try { PSet1 = parse_PropertySet(blob, null); } catch(e) {/* empty */}
|
|
for(y in PSet1) rval[y] = PSet1[y];
|
|
rval.FMTID = [FMTID0, FMTID1]; // TODO: verify FMTID0/1
|
|
return rval;
|
|
}
|
|
function write_PropertySetStream(entries, clsid, RE, PIDSI/*:{[key:string|number]:any}*/, entries2/*:?any*/, clsid2/*:?any*/) {
|
|
var hdr = new_buf(entries2 ? 68 : 48);
|
|
var bufs = [hdr];
|
|
hdr.write_shift(2, 0xFFFE);
|
|
hdr.write_shift(2, 0x0000); /* TODO: type 1 props */
|
|
hdr.write_shift(4, 0x32363237);
|
|
hdr.write_shift(16, CFB.utils.consts.HEADER_CLSID, "hex");
|
|
hdr.write_shift(4, (entries2 ? 2 : 1));
|
|
hdr.write_shift(16, clsid, "hex");
|
|
hdr.write_shift(4, (entries2 ? 68 : 48));
|
|
var ps0 = write_PropertySet(entries, RE, PIDSI);
|
|
bufs.push(ps0);
|
|
|
|
if(entries2) {
|
|
var ps1 = write_PropertySet(entries2, null, null);
|
|
hdr.write_shift(16, clsid2, "hex");
|
|
hdr.write_shift(4, 68 + ps0.length);
|
|
bufs.push(ps1);
|
|
}
|
|
return bconcat(bufs);
|
|
}
|
|
|
|
function parsenoop2(blob, length) { blob.read_shift(length); return null; }
|
|
function writezeroes(n, o) { if(!o) o=new_buf(n); for(var j=0; j<n; ++j) o.write_shift(1, 0); return o; }
|
|
|
|
function parslurp(blob, length, cb) {
|
|
var arr = [], target = blob.l + length;
|
|
while(blob.l < target) arr.push(cb(blob, target - blob.l));
|
|
if(target !== blob.l) throw new Error("Slurp error");
|
|
return arr;
|
|
}
|
|
|
|
function parsebool(blob, length/*:number*/) { return blob.read_shift(length) === 0x1; }
|
|
function writebool(v/*:any*/, o) { if(!o) o=new_buf(2); o.write_shift(2, +!!v); return o; }
|
|
|
|
function parseuint16(blob/*::, length:?number, opts:?any*/) { return blob.read_shift(2, 'u'); }
|
|
function writeuint16(v/*:number*/, o) { if(!o) o=new_buf(2); o.write_shift(2, v); return o; }
|
|
function parseuint16a(blob, length/*:: :?number, opts:?any*/) { return parslurp(blob,length,parseuint16);}
|
|
|
|
/* --- 2.5 Structures --- */
|
|
|
|
/* [MS-XLS] 2.5.10 Bes (boolean or error) */
|
|
function parse_Bes(blob/*::, length*/) {
|
|
var v = blob.read_shift(1), t = blob.read_shift(1);
|
|
return t === 0x01 ? v : v === 0x01;
|
|
}
|
|
function write_Bes(v, t/*:string*/, o) {
|
|
if(!o) o = new_buf(2);
|
|
o.write_shift(1, ((t == 'e') ? +v : +!!v));
|
|
o.write_shift(1, ((t == 'e') ? 1 : 0));
|
|
return o;
|
|
}
|
|
|
|
/* [MS-XLS] 2.5.240 ShortXLUnicodeString */
|
|
function parse_ShortXLUnicodeString(blob, length, opts) {
|
|
var cch = blob.read_shift(opts && opts.biff >= 12 ? 2 : 1);
|
|
var encoding = 'sbcs-cont';
|
|
var cp = current_codepage;
|
|
if(opts && opts.biff >= 8) current_codepage = 1200;
|
|
if(!opts || opts.biff == 8 ) {
|
|
var fHighByte = blob.read_shift(1);
|
|
if(fHighByte) { encoding = 'dbcs-cont'; }
|
|
} else if(opts.biff == 12) {
|
|
encoding = 'wstr';
|
|
}
|
|
if(opts.biff >= 2 && opts.biff <= 5) encoding = 'cpstr';
|
|
var o = cch ? blob.read_shift(cch, encoding) : "";
|
|
current_codepage = cp;
|
|
return o;
|
|
}
|
|
|
|
/* 2.5.293 XLUnicodeRichExtendedString */
|
|
function parse_XLUnicodeRichExtendedString(blob) {
|
|
var cp = current_codepage;
|
|
current_codepage = 1200;
|
|
var cch = blob.read_shift(2), flags = blob.read_shift(1);
|
|
var /*fHighByte = flags & 0x1,*/ fExtSt = flags & 0x4, fRichSt = flags & 0x8;
|
|
var width = 1 + (flags & 0x1); // 0x0 -> utf8, 0x1 -> dbcs
|
|
var cRun = 0, cbExtRst;
|
|
var z = {};
|
|
if(fRichSt) cRun = blob.read_shift(2);
|
|
if(fExtSt) cbExtRst = blob.read_shift(4);
|
|
var encoding = width == 2 ? 'dbcs-cont' : 'sbcs-cont';
|
|
var msg = cch === 0 ? "" : blob.read_shift(cch, encoding);
|
|
if(fRichSt) blob.l += 4 * cRun; //TODO: parse this
|
|
if(fExtSt) blob.l += cbExtRst; //TODO: parse this
|
|
z.t = msg;
|
|
if(!fRichSt) { z.raw = "<t>" + z.t + "</t>"; z.r = z.t; }
|
|
current_codepage = cp;
|
|
return z;
|
|
}
|
|
function write_XLUnicodeRichExtendedString(xlstr/*:: :XLString, opts*/) {
|
|
var str = (xlstr.t||""), nfmts = 1;
|
|
|
|
var hdr = new_buf(3 + (nfmts > 1 ? 2 : 0));
|
|
hdr.write_shift(2, str.length);
|
|
hdr.write_shift(1, (nfmts > 1 ? 0x08 : 0x00) | 0x01);
|
|
if(nfmts > 1) hdr.write_shift(2, nfmts);
|
|
|
|
var otext = new_buf(2 * str.length);
|
|
otext.write_shift(2 * str.length, str, 'utf16le');
|
|
|
|
var out = [hdr, otext];
|
|
|
|
return bconcat(out);
|
|
}
|
|
|
|
/* 2.5.296 XLUnicodeStringNoCch */
|
|
function parse_XLUnicodeStringNoCch(blob, cch, opts) {
|
|
var retval;
|
|
if(opts) {
|
|
if(opts.biff >= 2 && opts.biff <= 5) return blob.read_shift(cch, 'cpstr');
|
|
if(opts.biff >= 12) return blob.read_shift(cch, 'dbcs-cont');
|
|
}
|
|
var fHighByte = blob.read_shift(1);
|
|
if(fHighByte===0) { retval = blob.read_shift(cch, 'sbcs-cont'); }
|
|
else { retval = blob.read_shift(cch, 'dbcs-cont'); }
|
|
return retval;
|
|
}
|
|
|
|
/* 2.5.294 XLUnicodeString */
|
|
function parse_XLUnicodeString(blob, length, opts) {
|
|
var cch = blob.read_shift(opts && opts.biff == 2 ? 1 : 2);
|
|
if(cch === 0) { blob.l++; return ""; }
|
|
return parse_XLUnicodeStringNoCch(blob, cch, opts);
|
|
}
|
|
/* BIFF5 override */
|
|
function parse_XLUnicodeString2(blob, length, opts) {
|
|
if(opts.biff > 5) return parse_XLUnicodeString(blob, length, opts);
|
|
var cch = blob.read_shift(1);
|
|
if(cch === 0) { blob.l++; return ""; }
|
|
return blob.read_shift(cch, (opts.biff <= 4 || !blob.lens ) ? 'cpstr' : 'sbcs-cont');
|
|
}
|
|
/* TODO: BIFF5 and lower, codepage awareness */
|
|
function write_XLUnicodeString(str, opts, o) {
|
|
if(!o) o = new_buf(3 + 2 * str.length);
|
|
o.write_shift(2, str.length);
|
|
o.write_shift(1, 1);
|
|
o.write_shift(31, str, 'utf16le');
|
|
return o;
|
|
}
|
|
|
|
/* [MS-XLS] 2.5.61 ControlInfo */
|
|
function parse_ControlInfo(blob/*::, length, opts*/) {
|
|
var flags = blob.read_shift(1);
|
|
blob.l++;
|
|
var accel = blob.read_shift(2);
|
|
blob.l += 2;
|
|
return [flags, accel];
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.7.6 URLMoniker TODO: flags */
|
|
function parse_URLMoniker(blob/*::, length, opts*/) {
|
|
var len = blob.read_shift(4), start = blob.l;
|
|
var extra = false;
|
|
if(len > 24) {
|
|
/* look ahead */
|
|
blob.l += len - 24;
|
|
if(blob.read_shift(16) === "795881f43b1d7f48af2c825dc4852763") extra = true;
|
|
blob.l = start;
|
|
}
|
|
var url = blob.read_shift((extra?len-24:len)>>1, 'utf16le').replace(chr0,"");
|
|
if(extra) blob.l += 24;
|
|
return url;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.7.8 FileMoniker TODO: all fields */
|
|
function parse_FileMoniker(blob/*::, length*/) {
|
|
var cAnti = blob.read_shift(2);
|
|
var preamble = ""; while(cAnti-- > 0) preamble += "../";
|
|
var ansiPath = blob.read_shift(0, 'lpstr-ansi');
|
|
blob.l += 2; //var endServer = blob.read_shift(2);
|
|
if(blob.read_shift(2) != 0xDEAD) throw new Error("Bad FileMoniker");
|
|
var sz = blob.read_shift(4);
|
|
if(sz === 0) return preamble + ansiPath.replace(/\\/g,"/");
|
|
var bytes = blob.read_shift(4);
|
|
if(blob.read_shift(2) != 3) throw new Error("Bad FileMoniker");
|
|
var unicodePath = blob.read_shift(bytes>>1, 'utf16le').replace(chr0,"");
|
|
return preamble + unicodePath;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.7.2 HyperlinkMoniker TODO: all the monikers */
|
|
function parse_HyperlinkMoniker(blob, length) {
|
|
var clsid = blob.read_shift(16); length -= 16;
|
|
switch(clsid) {
|
|
case "e0c9ea79f9bace118c8200aa004ba90b": return parse_URLMoniker(blob, length);
|
|
case "0303000000000000c000000000000046": return parse_FileMoniker(blob, length);
|
|
default: throw new Error("Unsupported Moniker " + clsid);
|
|
}
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.7.9 HyperlinkString */
|
|
function parse_HyperlinkString(blob/*::, length*/) {
|
|
var len = blob.read_shift(4);
|
|
var o = len > 0 ? blob.read_shift(len, 'utf16le').replace(chr0, "") : "";
|
|
return o;
|
|
}
|
|
function write_HyperlinkString(str/*:string*/, o) {
|
|
if(!o) o = new_buf(6 + str.length * 2);
|
|
o.write_shift(4, 1 + str.length);
|
|
for(var i = 0; i < str.length; ++i) o.write_shift(2, str.charCodeAt(i));
|
|
o.write_shift(2, 0);
|
|
return o;
|
|
}
|
|
|
|
/* [MS-OSHARED] 2.3.7.1 Hyperlink Object */
|
|
function parse_Hyperlink(blob, length)/*:Hyperlink*/ {
|
|
var end = blob.l + length;
|
|
var sVer = blob.read_shift(4);
|
|
if(sVer !== 2) throw new Error("Unrecognized streamVersion: " + sVer);
|
|
var flags = blob.read_shift(2);
|
|
blob.l += 2;
|
|
var displayName, targetFrameName, moniker, oleMoniker, Loc="", guid, fileTime;
|
|
if(flags & 0x0010) displayName = parse_HyperlinkString(blob, end - blob.l);
|
|
if(flags & 0x0080) targetFrameName = parse_HyperlinkString(blob, end - blob.l);
|
|
if((flags & 0x0101) === 0x0101) moniker = parse_HyperlinkString(blob, end - blob.l);
|
|
if((flags & 0x0101) === 0x0001) oleMoniker = parse_HyperlinkMoniker(blob, end - blob.l);
|
|
if(flags & 0x0008) Loc = parse_HyperlinkString(blob, end - blob.l);
|
|
if(flags & 0x0020) guid = blob.read_shift(16);
|
|
if(flags & 0x0040) fileTime = parse_FILETIME(blob/*, 8*/);
|
|
blob.l = end;
|
|
var target = targetFrameName||moniker||oleMoniker||"";
|
|
if(target && Loc) target+="#"+Loc;
|
|
if(!target) target = "#" + Loc;
|
|
if((flags & 0x0002) && target.charAt(0) == "/" && target.charAt(1) != "/") target = "file://" + target;
|
|
var out = ({Target:target}/*:any*/);
|
|
if(guid) out.guid = guid;
|
|
if(fileTime) out.time = fileTime;
|
|
if(displayName) out.Tooltip = displayName;
|
|
return out;
|
|
}
|
|
function write_Hyperlink(hl) {
|
|
var out = new_buf(512), i = 0;
|
|
var Target = hl.Target;
|
|
if(Target.slice(0,7) == "file://") Target = Target.slice(7);
|
|
var hashidx = Target.indexOf("#");
|
|
var F = hashidx > -1 ? 0x1f : 0x17;
|
|
switch(Target.charAt(0)) { case "#": F=0x1c; break; case ".": F&=~2; break; }
|
|
out.write_shift(4,2); out.write_shift(4, F);
|
|
var data = [8,6815827,6619237,4849780,83]; for(i = 0; i < data.length; ++i) out.write_shift(4, data[i]);
|
|
if(F == 0x1C) {
|
|
Target = Target.slice(1);
|
|
write_HyperlinkString(Target, out);
|
|
} else if(F & 0x02) {
|
|
data = "e0 c9 ea 79 f9 ba ce 11 8c 82 00 aa 00 4b a9 0b".split(" ");
|
|
for(i = 0; i < data.length; ++i) out.write_shift(1, parseInt(data[i], 16));
|
|
var Pretarget = hashidx > -1 ? Target.slice(0, hashidx) : Target;
|
|
out.write_shift(4, 2*(Pretarget.length + 1));
|
|
for(i = 0; i < Pretarget.length; ++i) out.write_shift(2, Pretarget.charCodeAt(i));
|
|
out.write_shift(2, 0);
|
|
if(F & 0x08) write_HyperlinkString(hashidx > -1 ? Target.slice(hashidx+1): "", out);
|
|
} else {
|
|
data = "03 03 00 00 00 00 00 00 c0 00 00 00 00 00 00 46".split(" ");
|
|
for(i = 0; i < data.length; ++i) out.write_shift(1, parseInt(data[i], 16));
|
|
var P = 0;
|
|
while(Target.slice(P*3,P*3+3)=="../"||Target.slice(P*3,P*3+3)=="..\\") ++P;
|
|
out.write_shift(2, P);
|
|
out.write_shift(4, Target.length - 3 * P + 1);
|
|
for(i = 0; i < Target.length - 3 * P; ++i) out.write_shift(1, Target.charCodeAt(i + 3 * P) & 0xFF);
|
|
out.write_shift(1, 0);
|
|
out.write_shift(2, 0xFFFF);
|
|
out.write_shift(2, 0xDEAD);
|
|
for(i = 0; i < 6; ++i) out.write_shift(4, 0);
|
|
}
|
|
return out.slice(0, out.l);
|
|
}
|
|
|
|
/* 2.5.178 LongRGBA */
|
|
function parse_LongRGBA(blob/*::, length*/) { var r = blob.read_shift(1), g = blob.read_shift(1), b = blob.read_shift(1), a = blob.read_shift(1); return [r,g,b,a]; }
|
|
|
|
/* 2.5.177 LongRGB */
|
|
function parse_LongRGB(blob, length) { var x = parse_LongRGBA(blob, length); x[3] = 0; return x; }
|
|
|
|
|