diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..2045f80
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,8 @@
+DEPS=$(wildcard bits/*.js)
+
+xlsx.js: $(DEPS)
+	cat $^ > $@
+
+.PHONY: clean
+clean:
+	rm xlsx.js
diff --git a/bits/00_header.js b/bits/00_header.js
new file mode 100644
index 0000000..83d0233
--- /dev/null
+++ b/bits/00_header.js
@@ -0,0 +1,2 @@
+/* vim: set ts=2: */
+/*jshint eqnull:true */
diff --git a/bits/10_ssf.js b/bits/10_ssf.js
new file mode 100644
index 0000000..f973a22
--- /dev/null
+++ b/bits/10_ssf.js
@@ -0,0 +1,291 @@
+/* Spreadsheet Format -- jump to XLSX for the XLSX code */
+/*
+ * SSF renders a value through a spreadsheet number-format string.  Only
+ * date/time tokens, quoted or backslash-escaped literals, '@' and a short list
+ * of punctuation are understood; any other character (including the numeric
+ * placeholders '0' and '#') makes eval_fmt throw 'unrecognized character'.
+ */
+var SSF = (function() {
+  var SSF = {};
+/* Retained for backward compatibility only; nothing below depends on it. */
+String.prototype.reverse=function(){return this.split("").reverse().join("");};
+/* characters of x (coerced to a string) in reverse order */
+var _strrev = function(x) { return String(x).split("").reverse().join(""); };
+/* l copies of c joined together */
+function fill(c,l) { return new Array(l+1).join(c); }
+/* v as a string, left-padded with zeroes to at least d characters */
+function pad(v,d){var t=String(v);return t.length>=d?t:(fill(0,d-t.length)+t);}
+/* Options */
+var opts_fmt = {};
+/* copy into o (mutating it) every default from opts_fmt that o leaves undefined */
+function fixopts(o){for(var y in opts_fmt) if(o[y]===undefined) o[y]=opts_fmt[y];}
+SSF.opts = opts_fmt;
+opts_fmt.date1904 = 0; /* truthy: parse_date_code adds 1462 days to the serial */
+opts_fmt.output = "";
+opts_fmt.mode = ""; /* 'excel': parse_date_code shifts weekdays before serial 60 */
+/* format id -> format string; SSF.format looks numeric ids up here */
+var table_fmt = {
+  1: '0',
+  2: '0.00',
+  3: '#,##0',
+  4: '#,##0.00',
+  9: '0%',
+  10: '0.00%',
+  11: '0.00E+00',
+  12: '# ?/?',
+  13: '# ??/??',
+  14: 'mm/dd/yy',
+  15: 'd-mmm-yy',
+  16: 'd-mmm',
+  17: 'mmm-yy',
+  18: 'h:mm AM/PM',
+  19: 'h:mm:ss AM/PM',
+  20: 'h:mm',
+  21: 'h:mm:ss',
+  22: 'm/d/yy h:mm',
+  37: '#,##0 ;(#,##0)',
+  38: '#,##0 ;[Red](#,##0)',
+  39: '#,##0.00;(#,##0.00)',
+  40: '#,##0.00;[Red](#,##0.00)',
+  45: 'mm:ss',
+  46: '[h]:mm:ss',
+  47: 'mmss.0',
+  48: '##0.0E+0',
+  49: '@'
+};
+/* [abbreviated, full] weekday names, indexed by the q field of a parsed date */
+var days = [
+  ['Sun', 'Sunday'],
+  ['Mon', 'Monday'],
+  ['Tue', 'Tuesday'],
+  ['Wed', 'Wednesday'],
+  ['Thu', 'Thursday'],
+  ['Fri', 'Friday'],
+  ['Sat', 'Saturday']
+];
+/* [initial, abbreviated, full] month names, indexed by month number minus one */
+var months = [
+  ['J', 'Jan', 'January'],
+  ['F', 'Feb', 'February'],
+  ['M', 'Mar', 'March'],
+  ['A', 'Apr', 'April'],
+  ['M', 'May', 'May'],
+  ['J', 'Jun', 'June'],
+  ['J', 'Jul', 'July'],
+  ['A', 'Aug', 'August'],
+  ['S', 'Sep', 'September'],
+  ['O', 'Oct', 'October'],
+  ['N', 'Nov', 'November'],
+  ['D', 'Dec', 'December']
+];
+/*
+ * General format (id 0): booleans become TRUE/FALSE and strings pass through.
+ * NOTE: numbers use plain JS stringification, which only approximates the
+ * rounding and exponent rules spreadsheet applications apply -- TODO refine.
+ * Any other type yields undefined.
+ */
+var general_fmt = function(v) {
+  if(typeof v === 'boolean') return v ? "TRUE" : "FALSE";
+  if(typeof v === 'number') return String(v);
+  if(typeof v === 'string') return v;
+};
+SSF._general = general_fmt;
+/*
+ * Split the serial date v (whole part: day count where 1 is Jan 1 1900 and 60
+ * is the fictitious Feb 29 1900; fraction: time of day) into
+ * {D, T, y, m, d, H, M, S, q}: D/T are the day and second counts, q the weekday.
+ * opts.date1904 and opts.mode are honoured; opts is filled with defaults.
+ */
+var parse_date_code = function parse_date_code(v,opts) {
+  var date = Math.floor(v), time = Math.round(86400 * (v - date)), dow=0;
+  /* rounding may yield a whole day of seconds: carry it so that H stays < 24 */
+  if(time === 86400) { time = 0; ++date; }
+  var dout=[], out={D:date, T:time}; fixopts(opts = (opts||{}));
+  if(opts.date1904) date += 1462;
+  if(date === 60) { dout = [1900,2,29]; dow=3; }
+  else {
+    if(date > 60) --date;
+    /* 1 = Jan 1 1900 */
+    var d = new Date(1900,0,1);
+    d.setDate(d.getDate() + date - 1);
+    dout = [d.getFullYear(), d.getMonth()+1,d.getDate()];
+    dow = d.getDay();
+    if(opts.mode === 'excel' && date < 60) dow = (dow + 6) % 7;
+  }
+  out.y = dout[0]; out.m = dout[1]; out.d = dout[2];
+  out.S = time % 60; time = Math.floor(time / 60);
+  out.M = time % 60; time = Math.floor(time / 60);
+  out.H = time;
+  out.q = dow;
+  return out;
+};
+SSF.parse_date_code = parse_date_code;
+/*
+ * Render one date token.  type is the token class assigned by eval_fmt
+ * (y, m, d, h = 12-hour, H = 24-hour, M = minutes, s, A = AM/PM marker), fmt
+ * the token text and val a parse_date_code result.  Throws a string for
+ * token texts that are not supported.
+ */
+var write_date = function(type, fmt, val) {
+  switch(type) {
+    case 'y': switch(fmt) { /* year */
+      case 'y': case 'yy': return pad(val.y % 100,2);
+      default: return val.y;
+    } break;
+    case 'm': switch(fmt) { /* month */
+      case 'm': return val.m;
+      case 'mm': return pad(val.m,2);
+      case 'mmm': return months[val.m-1][1];
+      case 'mmmm': return months[val.m-1][2];
+      case 'mmmmm': return months[val.m-1][0];
+      default: throw 'bad month format: ' + fmt;
+    } break;
+    case 'd': switch(fmt) { /* day */
+      case 'd': return val.d;
+      case 'dd': return pad(val.d,2);
+      case 'ddd': return days[val.q][0];
+      case 'dddd': return days[val.q][1];
+      default: throw 'bad day format: ' + fmt;
+    } break;
+    case 'h': switch(fmt) { /* 12-hour */
+      case 'h': return 1+(val.H+11)%12;
+      case 'hh': return pad(1+(val.H+11)%12, 2);
+      default: throw 'bad hour format: ' + fmt;
+    } break;
+    case 'H': switch(fmt) { /* 24-hour */
+      case 'h': return val.H;
+      case 'hh': return pad(val.H, 2);
+      default: throw 'bad hour format: ' + fmt;
+    } break;
+    case 'M': switch(fmt) { /* minutes */
+      case 'm': return val.M;
+      case 'mm': return pad(val.M, 2);
+      default: throw 'bad minute format: ' + fmt;
+    } break;
+    case 's': switch(fmt) { /* seconds */
+      case 's': return val.S;
+      case 'ss': return pad(val.S, 2);
+      default: throw 'bad second format: ' + fmt;
+    } break;
+    /* val.H is the 24-hour field; the marker keeps its tail ("M" of "AM") */
+    case 'A': return (val.H>=12 ? 'P' : 'A') + fmt.substr(1);
+    default: throw 'bad format type ' + type + ' in ' + fmt;
+  }
+};
+/* split a format string into its ';'-separated sections; '\;' does not split */
+function split_fmt(fmt) {
+  return _strrev(fmt).split(/;(?!\\)/).reverse().map(_strrev);
+}
+SSF._split = split_fmt;
+/*
+ * Render v through the single format section fmt and return the text.
+ * Throws a string on characters or constructs that are not understood.
+ */
+function eval_fmt(fmt, v, opts) {
+  var out = [], o = "", i = 0, c = "", lst='t', q = {}, dt;
+  fixopts(opts = (opts || {}));
+  var hr='H';
+  /* Tokenize */
+  while(i < fmt.length) {
+    switch(c = fmt[i]) {
+      case '"': /* Literal text */
+        o = "";
+        for(++i; i < fmt.length && fmt[i] !== '"'; ++i) {
+          if(fmt[i] === '\\' && i + 1 < fmt.length) ++i;
+          o += fmt[i];
+        }
+        if(i >= fmt.length) throw 'unterminated string in ' + fmt;
+        /* step past the closing quote so it is not read as a new literal */
+        out.push({t:'t', v:o}); ++i; break;
+      case '\\': out.push({t:'t', v:fmt[++i]}); ++i; break;
+      case '@': /* Text Placeholder */
+        out.push({t:'T', v:v}); ++i; break;
+      /* Dates */
+      case 'm': case 'd': case 'y': case 'h': case 's':
+        if(!dt) dt = parse_date_code(v, opts);
+        o = fmt[i]; while(fmt[++i] === c) o+=c;
+        if(c === 'm' && lst.toLowerCase() === 'h') c = 'M'; /* m = minute */
+        if(c === 'h') c = hr;
+        q={t:c, v:o}; out.push(q); lst = c; break;
+      case 'A':
+        q={t:c,v:"A"};
+        if(fmt.substr(i, 3) === "A/P") { hr = 'h'; i+=3; }
+        else if(fmt.substr(i,5) === "AM/PM") { q.v = "AM"; i+=5; hr = 'h'; }
+        else { q.t = "t"; ++i; } /* lone 'A' is literal text; advance past it */
+        /* a marker may be the only date token, so make sure dt exists */
+        if(q.t === 'A' && !dt) dt = parse_date_code(v, opts);
+        out.push(q); lst = c; break;
+      case '[': /* ignore all conditionals and formatting */
+        while(i < fmt.length && fmt[i] !== ']') ++i;
+        if(i >= fmt.length) throw 'unterminated bracket in ' + fmt;
+        ++i; break;
+      default:
+        if("$-+/():!^&'~{}<>= ".indexOf(c) === -1)
+          throw 'unrecognized character ' + fmt[i] + ' in ' + fmt;
+        out.push({t:'t', v:c}); ++i; break;
+    }
+  }
+  /* walk backwards: every hour token takes the final 12/24-hour style, and */
+  /* an 'm' token whose next date token is seconds is re-read as minutes */
+  for(i=out.length-1, lst='t'; i >= 0; --i) {
+    switch(out[i].t) {
+      case 'h': case 'H': out[i].t = hr; lst='h'; break;
+      case 'd': case 'y': case 's': case 'M': lst=out[i].t; break;
+      case 'm': if(lst === 's') out[i].t = 'M'; break;
+    }
+  }
+
+  /* replace fields */
+  for(i=0; i < out.length; ++i) {
+    switch(out[i].t) {
+      case 't': case 'T': break;
+      case 'd': case 'm': case 'y': case 'h': case 'H': case 'M': case 's': case 'A':
+        out[i].v = write_date(out[i].t, out[i].v, dt);
+        out[i].t = 't'; break;
+      default: throw "unrecognized type " + out[i].t;
+    }
+  }
+
+  return out.map(function(x){return x.v;}).join("");
+}
+SSF._eval = eval_fmt;
+/*
+ * Pick the section of fmt (string or pre-split array) that applies to v:
+ * 1 section covers every number, 2 are non-negative;negative, 3 or more are
+ * positive;negative;zero.  Non-numbers use the 4th section, or '@' (the value
+ * unchanged) when the format has none.
+ */
+function choose_fmt(fmt, v) {
+  if(typeof fmt === "string") fmt = split_fmt(fmt);
+  if(typeof v !== "number") return fmt.length > 3 ? fmt[3] : "@";
+  switch(fmt.length) {
+    case 1: return fmt[0];
+    case 2: return v >= 0 ? fmt[0] : fmt[1];
+    default: return v > 0 ? fmt[0] : v < 0 ? fmt[1] : fmt[2];
+  }
+}
+
+/*
+ * Format v with fmt, which is either a format string or a numeric id (0 is
+ * General, other ids are looked up in table_fmt).  o carries the options and
+ * is filled with defaults.  Throws for an unknown id or for a format that
+ * eval_fmt cannot handle.
+ */
+var format = function format(fmt,v,o) {
+  fixopts(o = (o||{}));
+  if(fmt === 0) return general_fmt(v, o);
+  if(typeof fmt === 'number') {
+    if(table_fmt[fmt] === undefined) throw 'unknown format id ' + fmt;
+    fmt = table_fmt[fmt];
+  }
+  var f = choose_fmt(fmt, v, o);
+  return eval_fmt(f, v, o);
+};
+
+SSF._choose = choose_fmt;
+SSF._table = table_fmt;
+SSF.load = function(fmt, idx) { table_fmt[idx] = fmt; };
+SSF.format = format;
+
+  return SSF;
+})();
diff --git a/bits/70_xlsx.js b/bits/70_xlsx.js
new file mode 100644
index 0000000..dade954
--- /dev/null
+++ b/bits/70_xlsx.js
@@ -0,0 +1,594 @@
+
+var XLSX = (function(){
+var ct2type = {
+  "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet.main+xml": "workbooks",
+  "application/vnd.openxmlformats-package.core-properties+xml": "coreprops",
+  "application/vnd.openxmlformats-officedocument.extended-properties+xml": "extprops",
+  "application/vnd.openxmlformats-officedocument.spreadsheetml.calcChain+xml": "calcchains",
+  "application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml":"sheets",
+  "application/vnd.openxmlformats-officedocument.spreadsheetml.sharedStrings+xml": "strs",
+  "application/vnd.openxmlformats-officedocument.spreadsheetml.styles+xml":"styles",
+  "application/vnd.openxmlformats-officedocument.theme+xml":"themes",
+  "foo": "bar"
+};
+ +/* 18.2.28 (CT_WorkbookProtection) Defaults */ +var WBPropsDef = { + allowRefreshQuery: '0', + autoCompressPictures: '1', + backupFile: '0', + checkCompatibility: '0', + codeName: '', + date1904: '0', + dateCompatibility: '1', + //defaultThemeVersion: '0', + filterPrivacy: '0', + hidePivotFieldList: '0', + promptedSolutions: '0', + publishItems: '0', + refreshAllConnections: false, + saveExternalLinkValues: '1', + showBorderUnselectedTables: '1', + showInkAnnotation: '1', + showObjects: 'all', + showPivotChartFilter: '0' + //updateLinks: 'userSet' +}; + +/* 18.2.30 (CT_BookView) Defaults */ +var WBViewDef = { + activeTab: '0', + autoFilterDateGrouping: '1', + firstSheet: '0', + minimized: '0', + showHorizontalScroll: '1', + showSheetTabs: '1', + showVerticalScroll: '1', + tabRatio: '600', + visibility: 'visible' + //window{Height,Width}, {x,y}Window +}; + +/* 18.2.19 (CT_Sheet) Defaults */ +var SheetDef = { + state: 'visible' +}; + +/* 18.2.2 (CT_CalcPr) Defaults */ +var CalcPrDef = { + calcCompleted: 'true', + calcMode: 'auto', + calcOnSave: 'true', + concurrentCalc: 'true', + fullCalcOnLoad: 'false', + fullPrecision: 'true', + iterate: 'false', + iterateCount: '100', + iterateDelta: '0.001', + refMode: 'A1' +}; + +/* 18.2.3 (CT_CustomWorkbookView) Defaults */ +var CustomWBViewDef = { + autoUpdate: 'false', + changesSavedWin: 'false', + includeHiddenRowCol: 'true', + includePrintSettings: 'true', + maximized: 'false', + minimized: 'false', + onlySync: 'false', + personalView: 'false', + showComments: 'commIndicator', + showFormulaBar: 'true', + showHorizontalScroll: 'true', + showObjects: 'all', + showSheetTabs: 'true', + showStatusbar: 'true', + showVerticalScroll: 'true', + tabRatio: '600', + xWindow: '0', + yWindow: '0' +}; + +var XMLNS_CT = 'http://schemas.openxmlformats.org/package/2006/content-types'; +var XMLNS_WB = 'http://schemas.openxmlformats.org/spreadsheetml/2006/main'; + +var encodings = { + '"': '"', + ''': "'", + '>': '>', + '<': '<', + '&': '&' 
+}; + +// TODO: CP remap (need to read file version to determine OS) +function unescapexml(text){ + var s = text + ''; + for(var y in encodings) s = s.replace(new RegExp(y,'g'), encodings[y]); + return s.replace(/_x([0-9a-fA-F]*)_/g,function(m,c) {return _chr(parseInt(c,16));}); +} + +function parsexmltag(tag) { + var words = tag.split(/\s+/); + var z = {'0': words[0]}; + if(words.length === 1) return z; + tag.match(/(\w+)="([^"]*)"/g).map( + function(x){var y=x.match(/(\w+)="([^"]*)"/); z[y[1]] = y[2]; }); + return z; +} + + +var strs = {}; // shared strings +var styles = {}; // shared styles + + +/* 18.3 Worksheets */ +function parseSheet(data) { + /* 18.3.1.99 worksheet CT_Worksheet */ + var s = {}; + + /* 18.3.1.35 dimension CT_SheetDimension ? */ + var ref = data.match(//); + if(ref && ref.indexOf(":") !== -1) s["!ref"] = ref[1]; + + var refguess = {s: {r:1000000, c:1000000}, e: {r:0, c:0} }; + var q = ["v","f"]; + + /* 18.3.1.80 sheetData CT_SheetData ? */ + if(!data.match(//)) + data.match(/([^]*)<\/sheetData>/m)[1].split("").forEach(function(x) { + if(x === "" || x.trim() === "") return; + + /* 18.3.1.73 row CT_Row */ + var row = parsexmltag(x.match(/]*>/)[0]); + if(refguess.s.r > row.r - 1) refguess.s.r = row.r - 1; + if(refguess.e.r < row.r - 1) refguess.e.r = row.r - 1; + + /* 18.3.1.4 c CT_Cell */ + var cells = x.substr(x.indexOf('>')+1).split(/ idx - 1) refguess.s.c = idx - 1; + if(refguess.e.c < idx - 1) refguess.e.c = idx - 1; + var cell = parsexmltag((c.match(/]*>/)||[c])[0]); delete cell[0]; + var d = c.substr(c.indexOf('>')+1); + var p = {}; + q.forEach(function(f){var x=d.match(matchtag(f));if(x)p[f]=unescapexml(x[1]);}); + + /* SCHEMA IS ACTUALLY INCORRECT HERE. IF A CELL HAS NO T, EMIT "" */ + if(cell.t === undefined && p.v === undefined) { p.t = "str"; p.v = undefined; } + else p.t = (cell.t ? 
cell.t : "n"); // default is "n" in schema + switch(p.t) { + case 'n': p.v = parseFloat(p.v); break; + case 's': p.v = strs[parseInt(p.v, 10)].t; break; + case 'str': if(p.v) p.v = utf8read(p.v); break; // normal string + case 'inlineStr': + p.t = 'str'; p.v = unescapexml(d.match(matchtag('t'))[1]); + break; // inline string + case 'b': + switch(p.v) { + case '0': case 'FALSE': case "false": case false: p.v=false; break; + case '1': case 'TRUE': case "true": case true: p.v=true; break; + default: throw "Unrecognized boolean: " + p.v; + } break; + /* in case of error, stick value in .raw */ + case 'e': p.raw = p.v; p.v = undefined; break; + default: throw "Unrecognized cell type: " + p.t; + } + + /* formatting */ + if(cell.s) { + var cf = styles.CellXf[cell.s]; + if(cf && cf.numFmtId && cf.numFmtId != 0) { + p.raw = p.v; + p.rawt = p.t; + try { + p.v = SSF.format(cf.numFmtId,p.v); + p.t = 'str'; + } catch(e) { p.v = p.raw; } + } + } + + s[cell.r] = p; + }); + }); + if(!s["!ref"]) s["!ref"] = encode_range(refguess); + return s; +} + +// matches ... 
extracts content +function matchtag(f,g) {return new RegExp('<'+f+'(?: xml:space="preserve")?>([^]*)',(g||"")+"m");} + +function parseVector(data) { + var h = parsexmltag(data); + + var matches = data.match(new RegExp("(.*?)", 'g')); + if(matches.length != h.size) throw "unexpected vector length " + matches.length + " != " + h.size; + var res = []; + matches.forEach(function(x) { + var v = x.replace(/<[/]?vt:variant>/g,"").match(/]*)>(.*)191 && c<224) out += _chr((c & 31) << 6 | c2 & 63); + else { + c3 = orig.charCodeAt(i++); + out += _chr((c & 15) << 12 | (c2 & 63) << 6 | c3 & 63); + } + } + } + return out; +}; + +/* 18.4 Shared String Table */ +function parseStrs(data) { + var s = []; + var sst = data.match(new RegExp("]*)>([\\s\\S]*)<\/sst>","m")); + if(sst) { + s = sst[2].replace(//g,"").split(/<\/si>/).map(function(x) { var z = {}; + var y=x.match(/<(.*)>([\s\S]*)<\/.*/); if(y) z[y[1].split(" ")[0]]=utf8read(unescapexml(y[2])); return z;}); + + sst = parsexmltag(sst[1]); s.count = sst.count; s.uniqueCount = sst.uniqueCount; + } + return s; +} + +function parseProps(data) { + var p = { Company:'' }, q = {}; + var strings = ["Application", "DocSecurity", "Company", "AppVersion"]; + var bools = ["HyperlinksChanged","SharedDoc","LinksUpToDate","ScaleCrop"]; + var xtra = ["HeadingPairs", "TitlesOfParts"]; + var xtracp = ["category", "contentStatus", "lastModifiedBy", "lastPrinted", "revision", "version"]; + var xtradc = ["creator", "description", "identifier", "language", "subject", "title"]; + var xtradcterms = ["created", "modified"]; + xtra = xtra.concat(xtracp.map(function(x) { return "cp:" + x; })); + xtra = xtra.concat(xtradc.map(function(x) { return "dc:" + x; })); + xtra = xtra.concat(xtradcterms.map(function(x) { return "dcterms:" + x; })); + + + strings.forEach(function(f){p[f] = (data.match(matchtag(f))||[])[1];}); + bools.forEach(function(f){p[f] = (data.match(matchtag(f))||[])[1] == "true";}); + xtra.forEach(function(f) { + var cur = data.match(new 
RegExp("<" + f + "[^>]*>(.*)<\/" + f + ">")); + if(cur && cur.length > 0) q[f] = cur[1]; + }); + + if(q["HeadingPairs"] && q["TitlesOfParts"]) { + var v = parseVector(q["HeadingPairs"]); + var j = 0, widx = 0; + for(var i = 0; i !== v.length; ++i) { + switch(v[i].v) { + case "Worksheets": widx = j; p["Worksheets"] = +v[++i]; break; + case "Named Ranges": ++i; break; // TODO: Handle Named Ranges + default: console.error("Unrecognized key in Heading Pairs: " + v[i++].v); + } + } + var parts = parseVector(q["TitlesOfParts"]).map(utf8read); + p["SheetNames"] = parts.slice(widx, widx + p["Worksheets"]); + } + p["Creator"] = q["dc:creator"]; + p["LastModifiedBy"] = q["cp:lastModifiedBy"]; + p["CreatedDate"] = new Date(q["dcterms:created"]); + p["ModifiedDate"] = new Date(q["dcterms:modified"]); + return p; +} + +/* 18.6 Calculation Chain */ +function parseDeps(data) { + var d = []; + var l = 0, i = 1; + data.match(/<[^>]*>/g).forEach(function(x) { + var y = parsexmltag(x); + switch(y[0]) { + case '': case '': break; + /* 18.6.1 c CT_CalcCell 1 */ + case ']*>/g).forEach(function(x) { + var y = parsexmltag(x); + switch(y[0]) { + case ' 0 ? ct.calcchains[0] : ""; + ct.sst = ct.strs.length > 0 ? ct.strs[0] : ""; + ct.style = ct.styles.length > 0 ? ct.styles[0] : ""; + delete ct.calcchains; + return ct; +} + + +/* 18.2 Workbook */ +function parseWB(data) { + var wb = { AppVersion:{}, WBProps:{}, WBView:[], Sheets:[], CalcPr:{}, xmlns: "" }; + var pass = false; + data.match(/<[^>]*>/g).forEach(function(x) { + var y = parsexmltag(x); + switch(y[0]) { + case '': break; + + /* 18.2.13 fileVersion CT_FileVersion ? */ + case '': break; + + /* 18.2.12 fileSharing CT_FileSharing ? */ + case '': break; + + /* 18.2.28 workbookPr CT_WorkbookPr ? */ + case '': delete y[0]; wb.WBProps = y; break; + + /* 18.2.29 workbookProtection CT_WorkbookProtection ? */ + case '': break; + + /* 18.2.1 bookViews CT_BookViews ? 
*/ + case '': case '': break; + /* 18.2.30 workbookView CT_BookView + */ + case '': case '': break; // aggregate sheet + /* 18.2.19 sheet CT_Sheet + */ + case '': break; + /* 18.2.14 functionGroup CT_FunctionGroup + */ + case '': break; + /* 18.2.8 externalReference CT_ExternalReference + */ + case '': break; + case '': pass=true; break; + case '': pass=false; break; + /* 18.2.5 definedName CT_DefinedName + */ + case '': case '': break; + + /* 18.2.2 calcPr CT_CalcPr ? */ + case '': delete y[0]; wb.CalcPr = y; break; + + /* 18.2.16 oleSize CT_OleSize ? (ref required) */ + case '': case '': case '': break; + + /* 18.2.18 pivotCaches CT_PivotCaches ? */ + case '': case '': case '': break; + + /* 18.2.23 smartTagTypes CT_SmartTagTypes ? */ + case '': case '': break; + /* 18.2.22 smartTagType CT_SmartTagType ? */ + case '': break; + + /* 18.2.11 fileRecoveryPr CT_FileRecoveryPr ? */ + case '': break; + + /* 18.2.26 webPublishObjects CT_WebPublishObjects ? */ + case '': case '': break; + /* 18.2.25 webPublishObject CT_WebPublishObject ? 
*/ + case '': case '': case '': break; + /* 18.2.7 ext CT_Extension + */ + case '': pass=false; break; + + /* Others */ + case '': pass=false; break; + + default: if(!pass) console.error("WB Tag",x,y); + } + }); + if(wb.xmlns !== XMLNS_WB) throw "Unknown Namespace: " + wb.xmlns; + + var z; + /* defaults */ + for(z in WBPropsDef) if(null == wb.WBProps[z]) wb.WBProps[z] = WBPropsDef[z]; + for(z in CalcPrDef) if(null == wb.CalcPr[z]) wb.CalcPr[z] = CalcPrDef[z]; + + wb.WBView.forEach(function(w){for(var z in WBViewDef) if(null==w[z]) w[z]=WBViewDef[z]; }); + wb.Sheets.forEach(function(w){for(var z in SheetDef) if(null==w[z]) w[z]=SheetDef[z]; }); + + return wb; +} + +/* 18.8.31 numFmts CT_NumFmts */ +function parseNumFmts(t) { + styles.NumberFmt = []; + for(y in SSF._table) styles.NumberFmt[y] = SSF._table[y]; + t[0].match(/<[^>]*>/g).forEach(function(x) { + var y = parsexmltag(x); + switch(y[0]) { + case '': case '': break; + case ']*>/g).forEach(function(x) { + var y = parsexmltag(x); + switch(y[0]) { + case '': case '': break; + + /* 18.8.45 xf CT_Xf */ + case '': break; + + /* 18.8.1 alignment CT_CellAlignment */ + case '': break; + case ']*)>.*<\/numFmts>/)) parseNumFmts(t); + + /* fonts CT_Fonts ? */ + /* fills CT_Fills ? */ + /* borders CT_Borders ? */ + /* cellStyleXfs CT_CellStyleXfs ? */ + + /* cellXfs CT_CellXfs ? */ + if(t=data.match(/]*)>.*<\/cellXfs>/)) parseCXfs(t); + + /* dxfs CT_Dxfs ? */ + /* tableStyles CT_TableStyles ? */ + /* colors CT_Colors ? */ + /* extLst CT_ExtensionList ? 
*/ + + return styles; +} + +function parseZip(zip) { + var entries = Object.keys(zip.files); + var keys = entries.filter(function(x){return x.substr(-1) != '/';}).sort(); + var dir = parseCT((zip.files['[Content_Types].xml']||{}).data); + + strs = {}; + if(dir.sst) strs=parseStrs(zip.files[dir.sst.replace(/^\//,'')].data); + + styles = {}; + if(dir.style) styles = parseStyles(zip.files[dir.style.replace(/^\//,'')].data); + + var wb = parseWB(zip.files[dir.workbooks[0].replace(/^\//,'')].data); + var propdata = dir.coreprops.length !== 0 ? zip.files[dir.coreprops[0].replace(/^\//,'')].data : ""; + propdata += dir.extprops.length !== 0 ? zip.files[dir.extprops[0].replace(/^\//,'')].data : ""; + var props = propdata !== "" ? parseProps(propdata) : {}; + var deps = {}; + if(dir.calcchain) deps=parseDeps(zip.files[dir.calcchain.replace(/^\//,'')].data); + var sheets = {}, i=0; + if(!props.Worksheets) { + /* Google Docs doesn't generate the appropriate metadata, so we impute: */ + var wbsheets = wb.Sheets; + props.Worksheets = wbsheets.length; + props.SheetNames = []; + for(var j = 0; j != wbsheets.length; ++j) { + props.SheetNames[j] = wbsheets[j].name; + } + for(i = 0; i != props.Worksheets; ++i) { + sheets[props.SheetNames[i]]=parseSheet(zip.files['xl/worksheets/sheet' + (i+1) + '.xml'].data); + } + } + else { + for(i = 0; i != props.Worksheets; ++i) { + sheets[props.SheetNames[i]]=parseSheet(zip.files[dir.sheets[i].replace(/^\//,'')].data); + } + } + return { + Directory: dir, + Workbook: wb, + Props: props, + Deps: deps, + Sheets: sheets, + SheetNames: props.SheetNames, + Strings: strs, + Styles: styles, + keys: keys, + files: zip.files + }; +} + +var _fs, jszip; +if(typeof JSZip !== "undefined") jszip = JSZip; +if (typeof exports !== 'undefined') { + if (typeof module !== 'undefined' && module.exports) { + if(typeof jszip === 'undefined') jszip = require('./jszip').JSZip; + _fs = require('fs'); + } +} + +function readSync(data, options) { + var zip, d = data; + var 
o = options||{}; + switch((o.type||"base64")){ + case "file": d = _fs.readFileSync(data).toString('base64'); + /* falls through */ + case "base64": zip = new jszip(d, { base64:true }); break; + case "binary": zip = new jszip(d, { base64:false }); break; + } + return parseZip(zip); +} + +function readFileSync(data, options) { + var o = options||{}; o.type = 'file'; + return readSync(data, o); +} + +this.read = readSync; +this.readFile = readFileSync; +this.parseZip = parseZip; +return this; + +})(); + diff --git a/bits/90_utils.js b/bits/90_utils.js new file mode 100644 index 0000000..ba05730 --- /dev/null +++ b/bits/90_utils.js @@ -0,0 +1,102 @@ +var _chr = function(c) { return String.fromCharCode(c); }; + +function encode_col(col) { var s=""; for(++col; col; col=Math.floor((col-1)/26)) s = _chr(((col-1)%26) + 65) + s; return s; } +function encode_row(row) { return "" + (row + 1); } +function encode_cell(cell) { return encode_col(cell.c) + encode_row(cell.r); } + +function decode_col(c) { var d = 0, i = 0; for(; i !== c.length; ++i) d = 26*d + c.charCodeAt(i) - 64; return d - 1; } +function decode_row(rowstr) { return Number(rowstr) - 1; } +function split_cell(cstr) { return cstr.replace(/(\$?[A-Z]*)(\$?[0-9]*)/,"$1,$2").split(","); } +function decode_cell(cstr) { var splt = split_cell(cstr); return { c:decode_col(splt[0]), r:decode_row(splt[1]) }; } +function decode_range(range) { var x =range.split(":").map(decode_cell); return {s:x[0],e:x[x.length-1]}; } +function encode_range(range) { return encode_cell(range.s) + ":" + encode_cell(range.e); } +/** + * Convert a sheet into an array of objects where the column headers are keys. 
+ **/
+function sheet_to_row_object_array(sheet){
+  var val, rowObject, range, columnHeaders, emptyRow, C;
+  var outSheet = [];
+  if (sheet["!ref"]) {
+    range = decode_range(sheet["!ref"]);
+
+    /* the first row of the range supplies the keys (string/number cells only) */
+    columnHeaders = {};
+    for (C = range.s.c; C <= range.e.c; ++C) {
+      val = sheet[encode_cell({c: C, r: range.s.r})];
+      if(val){
+        switch(val.t) {
+          case 's': case 'str': columnHeaders[C] = val.v; break;
+          case 'n': columnHeaders[C] = val.v; break;
+        }
+      }
+    }
+
+    for (var R = range.s.r + 1; R <= range.e.r; ++R) {
+      emptyRow = true;
+      //Row number is recorded in the prototype
+      //so that it doesn't appear when stringified.
+      rowObject = Object.create({ __rowNum__ : R });
+      for (C = range.s.c; C <= range.e.c; ++C) {
+        val = sheet[encode_cell({c: C, r: R})];
+        if(val !== undefined) switch(val.t){
+          case 's': case 'str': case 'b': case 'n':
+            if(val.v !== undefined) {
+              rowObject[columnHeaders[C]] = val.v;
+              emptyRow = false;
+            }
+            break;
+          case 'e': break; /* error cells are skipped rather than thrown */
+          default: throw 'unrecognized type ' + val.t;
+        }
+      }
+      /* rows without any defined value are left out of the result */
+      if(!emptyRow) {
+        outSheet.push(rowObject);
+      }
+    }
+  }
+  return outSheet;
+}
+
+/* Render the cells inside sheet["!ref"] as comma-separated text, one "\n"-terminated line per row. */
+function sheet_to_csv(sheet) {
+  /* string cells are always quoted; embedded quotes are doubled (RFC 4180) */
+  var quote = function quote(s) { return '"' + String(s).replace(/"/g, '""') + '"'; };
+  var stringify = function stringify(val) {
+    switch(val.t){
+      case 'n': return val.v;
+      case 's': case 'str': return val.v === undefined ? "" : quote(val.v);
+      case 'b': return val.v ? "TRUE" : "FALSE";
+      case 'e': return ""; /* throw out value in case of error */
+      default: throw 'unrecognized type ' + val.t;
+    }
+  };
+  var out = "";
+  if(sheet["!ref"]) {
+    var r = utils.decode_range(sheet["!ref"]);
+    for(var R = r.s.r; R <= r.e.r; ++R) {
+      var row = [];
+      for(var C = r.s.c; C <= r.e.c; ++C) {
+        var val = sheet[utils.encode_cell({c:C,r:R})];
+        row.push(val ? stringify(val) : "");
+      }
+      out += row.join(",") + "\n";
+    }
+  }
+  return out;
+}
+
+var utils = {
+  encode_col: encode_col,
+  encode_row: encode_row,
+  encode_cell: encode_cell,
+  encode_range: encode_range,
+  decode_col: decode_col,
+  decode_row: decode_row,
+  split_cell: split_cell,
+  decode_cell: decode_cell,
+  decode_range: decode_range,
+  sheet_to_csv: sheet_to_csv,
+  sheet_to_row_object_array: sheet_to_row_object_array
+};
diff --git a/bits/99_footer.js b/bits/99_footer.js
new file mode 100644
index 0000000..dd36528
--- /dev/null
+++ b/bits/99_footer.js
@@ -0,0 +1,12 @@
+
+if(typeof require !== 'undefined' && typeof exports !== 'undefined') {
+  exports.read = XLSX.read;
+  exports.readFile = XLSX.readFile;
+  exports.utils = utils;
+  exports.main = function(args) { /* reads the workbook file named by args[0] and logs its Sheets */
+    var zip = XLSX.read(args[0], {type:'file'});
+    console.log(zip.Sheets);
+  };
+if(typeof module !== 'undefined' && require.main === module)
+  exports.main(process.argv.slice(2));
+}